{ "schemaVersion": 1, "deviceProperties": [ { "id": 0, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 1, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 2, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 3, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 4, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 5, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 6, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 }, { "id": 7, "name": "NVIDIA H200", "totalGlobalMem": 149631664128, "computeMajor": 9, "computeMinor": 0, "maxThreadsPerBlock": 1024, "maxThreadsPerMultiprocessor": 2048, "regsPerBlock": 65536, "warpSize": 32, "sharedMemPerBlock": 49152, "numSms": 132 , "regsPerMultiprocessor": 65536, "sharedMemPerBlockOptin": 232448, "sharedMemPerMultiprocessor": 233472 } ], "cupti_version": 22, "cuda_runtime_version": 12040, "cuda_driver_version": 12080, "distributedInfo": {"backend": "nccl", "rank": 1, "world_size": 8, "pg_count": 1, "pg_config": [{"pg_name": "0", "pg_desc": "default_pg", "backend_config": "cuda:nccl", "pg_size": 8, "ranks": [0, 1, 2, 3, 4, 5, 6, 7]}], "nccl_version": "2.21.5"}, "record_shapes": 1, "trace_id": "87C9E3DDAB0E48DC981F6913E327958F", "traceEvents": [ { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: DivBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650730526.478, "dur": 112.769, "args": { "External id": 17409,"Record function id": 0, "Sequence number": 246770, "Fwd thread id": 1, "Ev Idx": 0 } }, { "ph": "X", "cat": "cpu_op", "name": "DivBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650730545.067, "dur": 85.616, "args": { "External id": 17410,"Sequence number": 246770, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 1 } }, { "ph": "f", "id": 1, "pid": 1336754, "tid": 1381179, "ts": 1295650730545.067, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336754, "tid": 1381179, "ts": 1295650730552.101, "dur": 76.542, "args": { "External id": 17411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 2 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650730652.465, "dur": 196.561, "args": { "External id": 17412,"Record function id": 0, "Ev Idx": 3 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650730704.700, "dur": 80.382, "args": { "External id": 17413,"Record function id": 0, "Ev Idx": 4 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.27", "pid": 1336754, "tid": 1381179, "ts": 1295650730733.228, "dur": 40.823, "args": { "External id": 17414,"Record function id": 0, "Ev Idx": 5 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650730790.111, "dur": 1.561, "args": { "External id": 17415,"Sequence number": 246769, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 6 } }, { "ph": "f", "id": 2, "pid": 1336754, "tid": 1381179, "ts": 1295650730790.111, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650730795.127, "dur": 49.549, "args": { "External id": 17416,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 7 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650730803.748, "dur": 40.424, "args": { "External id": 17417,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 8 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650730812.078, "dur": 2.351, "args": { "External id": 17418,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650730857.548, "dur": 36398.061, "args": { "External id": 17419,"Record function id": 0, "Sequence number": 246767, "Fwd thread id": 1, "Ev Idx": 10 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650730859.050, "dur": 36383.043, "args": { "External id": 17420,"Sequence number": 246767, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11 } }, { "ph": "f", "id": 3, "pid": 1336754, "tid": 1381179, "ts": 1295650730859.050, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650730897.202, "dur": 3.705, "args": { "External id": 17421,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 12 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650730903.746, "dur": 36203.773, "args": { "External id": 17422,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 13 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650730908.332, "dur": 36198.754, "args": { "External id": 17423,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 14 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650730911.658, "dur": 6.804, "args": { "External id": 17424,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 15 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650730920.064, "dur": 36184.900, "args": { "External id": 17425,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 16 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336754, "tid": 1381179, "ts": 1295650767113.518, "dur": 0.670, "args": { "External id": 17426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 17 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650767117.021, "dur": 3.329, "args": { "External id": 17427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 18 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650767118.779, "dur": 1.362, "args": { "External id": 17428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 19 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1381179, "ts": 1295650767127.338, "dur": 36.616, "args": { "External id": 17429,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 20 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1381179, "ts": 1295650767171.902, "dur": 47.589, "args": { "External id": 17430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 21 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1381179, "ts": 1295650767173.615, "dur": 45.665, "args": { "External id": 17431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 22 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1381179, "ts": 1295650767175.320, "dur": 43.662, "args": { "External id": 17432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 23 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767268.450, "dur": 17.000, "args": { "External id": 17433,"Record function id": 0, "Sequence number": 246766, "Fwd thread id": 1, "Ev Idx": 24 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767270.462, "dur": 12.119, "args": { "External id": 17434,"Sequence number": 246766, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 25 } }, { "ph": "f", "id": 4, "pid": 1336754, "tid": 1381179, "ts": 1295650767270.462, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650767274.747, "dur": 7.604, "args": { "External id": 17435,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 26 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650767277.210, "dur": 4.932, "args": { "External id": 17436,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 27 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767289.516, "dur": 100.159, "args": { "External id": 17437,"Record function id": 0, "Sequence number": 246765, "Fwd thread id": 1, "Ev Idx": 28 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767290.662, "dur": 92.239, "args": { "External id": 17438,"Sequence number": 246765, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 29 } }, { "ph": "f", "id": 5, "pid": 1336754, "tid": 1381179, "ts": 1295650767290.662, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650767295.007, "dur": 87.234, "args": { "External id": 17439,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 30 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650767299.882, "dur": 36.094, "args": { "External id": 17440,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 31 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650767302.512, "dur": 5.023, "args": { "External id": 17441,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 32 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650767308.867, "dur": 26.806, "args": { "External id": 17442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 33 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650767313.141, "dur": 22.081, "args": { "External id": 17443,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 34 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650767338.335, "dur": 5.685, "args": { "External id": 17444,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 35 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767341.988, "dur": 1.560, "args": { "External id": 17445,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 36 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650767345.359, "dur": 36.048, "args": { "External id": 17446,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 37 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767394.378, "dur": 60.175, "args": { "External id": 17447,"Record function id": 0, "Sequence number": 246764, "Fwd thread id": 1, "Ev Idx": 38 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767395.563, "dur": 55.722, "args": { "External id": 17448,"Sequence number": 246764, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 39 } }, { "ph": "f", "id": 6, "pid": 1336754, "tid": 1381179, "ts": 1295650767395.563, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650767398.673, "dur": 52.318, "args": { "External id": 17449,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "3"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 40 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650767401.289, "dur": 19.470, "args": { "External id": 17450,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 41 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650767402.596, "dur": 2.837, "args": { "External id": 17451,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 42 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650767406.110, "dur": 14.375, "args": { "External id": 17452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 43 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650767407.168, "dur": 12.984, "args": { "External id": 17453,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 44 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650767424.713, "dur": 6.828, "args": { "External id": 17454,"Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 45 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767429.675, "dur": 1.178, "args": { "External id": 17455,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 46 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650767432.258, "dur": 18.261, "args": { "External id": 17456,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 47 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767459.244, "dur": 126.397, "args": { "External id": 17457,"Record function id": 0, "Sequence number": 246763, "Fwd thread id": 1, "Ev Idx": 48 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767460.363, "dur": 121.497, "args": { "External id": 17458,"Sequence number": 246763, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 49 } }, { "ph": "f", "id": 7, "pid": 1336754, "tid": 1381179, "ts": 1295650767460.363, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650767462.453, "dur": 119.086, "args": { "External id": 17459,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 50 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650767466.167, "dur": 16.939, "args": { "External id": 17460,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 51 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650767467.275, "dur": 2.052, "args": { "External id": 17461,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 52 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650767469.910, "dur": 12.946, "args": { "External id": 17462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 53 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650767471.060, "dur": 11.431, "args": { "External id": 17463,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 54 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650767486.442, "dur": 3.336, "args": { "External id": 17464,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 55 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767488.200, "dur": 1.385, "args": { "External id": 17465,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 56 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650767490.593, "dur": 90.246, "args": { "External id": 17466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 57 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767591.879, "dur": 96.863, "args": { "External id": 17467,"Record function id": 0, "Sequence number": 246762, "Fwd thread id": 1, "Ev Idx": 58 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767593.233, "dur": 92.224, "args": { "External id": 17468,"Sequence number": 246762, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 59 } }, { "ph": "f", "id": 8, "pid": 1336754, "tid": 1381179, "ts": 1295650767593.233, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650767594.655, "dur": 90.486, "args": { "External id": 17469,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 60 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650767596.145, "dur": 19.172, "args": { "External id": 17470,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 61 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650767597.098, "dur": 3.519, "args": { "External id": 17471,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 62 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650767601.253, "dur": 13.795, "args": { "External id": 17472,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 63 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650767602.031, "dur": 12.684, "args": { "External id": 17473,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 64 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650767618.737, "dur": 4.084, "args": { "External id": 17474,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 65 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767622.310, "dur": 0.342, "args": { "External id": 17475,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 66 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650767623.266, "dur": 61.208, "args": { "External id": 17476,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 67 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767692.764, "dur": 35.527, "args": { "External id": 17477,"Record function id": 0, "Sequence number": 246761, "Fwd thread id": 1, "Ev Idx": 68 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650767694.161, "dur": 0.943, "args": { "External id": 17478,"Sequence number": 246761, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 69 } }, { "ph": "f", "id": 9, "pid": 1336754, "tid": 1381179, "ts": 1295650767694.161, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650767697.701, "dur": 27.687, "args": { "External id": 17479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 70 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650767700.560, "dur": 24.241, "args": { "External id": 17480,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 71 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767706.607, "dur": 0.440, "args": { "External id": 17481,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 72 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650767733.197, "dur": 2312.960, "args": { "External id": 17482,"Record function id": 0, "Sequence number": 246759, "Fwd thread id": 1, "Ev Idx": 73 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650767734.726, "dur": 2274.936, "args": { "External id": 17483,"Sequence number": 246759, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 74 } }, { "ph": "f", "id": 10, "pid": 1336754, "tid": 1381179, "ts": 1295650767734.726, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650767772.996, "dur": 3.036, "args": { "External id": 17484,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 75 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650767778.549, "dur": 2115.211, "args": { "External id": 17485,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 76 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650767780.365, "dur": 2113.112, "args": { "External id": 17486,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 77 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650767783.068, "dur": 4.004, "args": { "External id": 17487,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 78 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650767790.623, "dur": 2101.927, "args": { "External id": 17488,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 79 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336754, "tid": 1381179, "ts": 1295650769897.265, "dur": 0.353, "args": { "External id": 17489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 80 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650769899.081, "dur": 2.471, "args": { "External id": 17490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 81 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650769900.348, "dur": 1.080, "args": { "External id": 17491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 82 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1381179, "ts": 1295650769905.941, "dur": 24.281, "args": { "External id": 17492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 83 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1381179, "ts": 1295650769936.013, "dur": 41.322, "args": { "External id": 17493,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 84 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1381179, "ts": 1295650769937.494, "dur": 39.637, "args": { "External id": 17494,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 85 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1381179, "ts": 1295650769939.301, "dur": 37.380, "args": { "External id": 17495,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 86 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650770020.613, "dur": 22.097, "args": { "External id": 17496,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 87 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770054.751, "dur": 14.643, "args": { "External id": 17497,"Record function id": 0, "Sequence number": 246758, "Fwd thread id": 1, "Ev Idx": 88 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770058.513, "dur": 8.698, "args": { "External id": 17498,"Sequence number": 246758, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 89 } }, { "ph": "f", "id": 11, "pid": 1336754, "tid": 1381179, "ts": 1295650770058.513, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650770061.299, "dur": 5.718, "args": { "External id": 17499,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 90 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650770063.008, "dur": 3.867, "args": { "External id": 17500,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 91 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770072.572, "dur": 70.056, "args": { "External id": 17501,"Record function id": 0, "Sequence number": 246757, "Fwd thread id": 1, "Ev Idx": 92 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770073.548, "dur": 64.774, "args": { "External id": 17502,"Sequence number": 246757, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 93 } }, { "ph": "f", "id": 12, "pid": 1336754, "tid": 1381179, "ts": 1295650770073.548, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650770075.879, "dur": 62.113, "args": { "External id": 17503,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 94 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650770078.661, "dur": 23.782, "args": { "External id": 17504,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 95 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650770080.644, "dur": 3.295, "args": { "External id": 17505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 96 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650770084.891, "dur": 17.225, "args": { "External id": 17506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 97 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650770086.206, "dur": 15.486, "args": { "External id": 17507,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 98 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650770103.831, "dur": 6.158, "args": { "External id": 17508,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 99 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770107.066, "dur": 2.678, "args": { "External id": 17509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650770112.789, "dur": 24.395, "args": { "External id": 17510,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770146.691, "dur": 51.992, "args": { "External id": 17511,"Record function id": 0, "Sequence number": 246756, "Fwd thread id": 1, "Ev Idx": 102 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770148.127, "dur": 47.802, "args": { "External id": 17512,"Sequence number": 246756, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 103 } }, { "ph": "f", "id": 13, "pid": 1336754, "tid": 1381179, "ts": 1295650770148.127, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650770150.301, "dur": 45.380, "args": { "External id": 17513,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "2"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650770152.419, "dur": 18.688, "args": { "External id": 17514,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650770153.392, "dur": 2.138, "args": { "External id": 17515,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650770156.400, "dur": 14.447, "args": { "External id": 17516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650770157.106, "dur": 13.321, "args": { "External id": 17517,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650770172.206, "dur": 7.004, "args": { "External id": 17518,"Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770177.818, "dur": 0.857, "args": { "External id": 17519,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650770179.987, "dur": 15.289, "args": { "External id": 17520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770202.531, "dur": 106.924, "args": { "External id": 17521,"Record function id": 0, "Sequence number": 246755, "Fwd thread id": 1, "Ev Idx": 112 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770203.682, "dur": 102.128, "args": { "External id": 17522,"Sequence number": 246755, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 113 } }, { "ph": "f", "id": 14, "pid": 1336754, "tid": 1381179, "ts": 1295650770203.682, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650770205.953, "dur": 99.605, "args": { "External id": 17523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650770207.020, "dur": 15.017, "args": { "External id": 17524,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650770207.868, "dur": 1.875, "args": { "External id": 17525,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650770210.355, "dur": 11.427, "args": { "External id": 17526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650770211.187, "dur": 10.287, "args": { "External id": 17527,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650770223.063, "dur": 16.873, "args": { "External id": 17528,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770227.150, "dur": 12.141, "args": { "External id": 17529,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650770241.227, "dur": 63.573, "args": { "External id": 17530,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770317.386, "dur": 94.789, "args": { "External id": 17531,"Record function id": 0, "Sequence number": 246754, "Fwd thread id": 1, "Ev Idx": 122 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770318.375, "dur": 74.586, "args": { "External id": 17532,"Sequence number": 246754, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 123 } }, { "ph": "f", "id": 15, "pid": 1336754, "tid": 1381179, "ts": 1295650770318.375, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650770320.642, "dur": 72.030, "args": { "External id": 17533,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650770322.365, "dur": 17.419, "args": { "External id": 17534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650770323.396, "dur": 2.584, "args": { "External id": 17535,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650770326.652, "dur": 12.871, "args": { "External id": 17536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650770327.773, "dur": 11.457, "args": { "External id": 17537,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650770340.696, "dur": 2.837, "args": { "External id": 17538,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770342.733, "dur": 0.644, "args": { "External id": 17539,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650770344.050, "dur": 47.963, "args": { "External id": 17540,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650770397.039, "dur": 13.800, "args": { "External id": 17541,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 132 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770418.297, "dur": 32.811, "args": { "External id": 17542,"Record function id": 0, "Sequence number": 246753, "Fwd thread id": 1, "Ev Idx": 133 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650770419.185, "dur": 1.019, "args": { "External id": 17543,"Sequence number": 246753, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 134 } }, { "ph": "f", "id": 16, "pid": 1336754, "tid": 1381179, "ts": 1295650770419.185, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650770421.979, "dur": 26.685, "args": { "External id": 17544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650770424.149, "dur": 23.991, "args": { "External id": 17545,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770429.085, "dur": 2.740, "args": { "External id": 17546,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650770455.510, "dur": 3096.685, "args": { "External id": 17547,"Record function id": 0, "Sequence number": 246751, "Fwd thread id": 1, "Ev Idx": 138 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650770458.984, "dur": 3069.075, "args": { "External id": 17548,"Sequence number": 246751, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 139 } }, { "ph": "f", "id": 17, "pid": 1336754, "tid": 1381179, "ts": 1295650770458.984, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650770486.829, "dur": 2.272, "args": { "External id": 17549,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650770490.943, "dur": 2951.882, "args": { "External id": 17550,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650770492.223, "dur": 2950.261, "args": { "External id": 17551,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650770494.992, "dur": 3.269, "args": { "External id": 17552,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650770499.017, "dur": 2942.630, "args": { "External id": 17553,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336754, "tid": 1381179, "ts": 1295650773445.840, "dur": 0.292, "args": { "External id": 17554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650773447.074, "dur": 4.257, "args": { "External id": 17555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 146 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650773450.257, "dur": 0.919, "args": { "External id": 17556,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1381179, "ts": 1295650773454.979, "dur": 22.133, "args": { "External id": 17557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1381179, "ts": 1295650773482.089, "dur": 39.388, "args": { "External id": 17558,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1381179, "ts": 1295650773483.255, "dur": 38.044, "args": { "External id": 17559,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1381179, "ts": 1295650773484.594, "dur": 36.438, "args": { "External id": 17560,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650773534.527, "dur": 14.747, "args": { "External id": 17561,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773561.541, "dur": 10.789, "args": { "External id": 17562,"Record function id": 0, "Sequence number": 246750, "Fwd thread id": 1, "Ev Idx": 153 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773562.997, "dur": 7.378, "args": { "External id": 17563,"Sequence number": 246750, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 154 } }, { "ph": "f", "id": 18, "pid": 1336754, "tid": 1381179, "ts": 1295650773562.997, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650773565.434, "dur": 4.755, "args": { "External id": 17564,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650773567.097, "dur": 2.986, "args": { "External id": 17565,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773575.689, "dur": 61.443, "args": { "External id": 17566,"Record function id": 0, "Sequence number": 246749, "Fwd thread id": 1, "Ev Idx": 157 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773578.811, "dur": 54.419, "args": { "External id": 17567,"Sequence number": 246749, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 158 } }, { "ph": "f", "id": 19, "pid": 1336754, "tid": 1381179, "ts": 1295650773578.811, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650773581.060, "dur": 51.853, "args": { "External id": 17568,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650773583.901, "dur": 19.694, "args": { "External id": 17569,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650773585.778, "dur": 2.524, "args": { "External id": 17570,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650773588.801, "dur": 14.506, "args": { "External id": 17571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650773590.100, "dur": 12.759, "args": { "External id": 17572,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650773605.044, "dur": 4.087, "args": { "External id": 17573,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773607.789, "dur": 1.042, "args": { "External id": 17574,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650773610.075, "dur": 22.056, "args": { "External id": 17575,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 166 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773640.993, "dur": 52.030, "args": { "External id": 17576,"Record function id": 0, "Sequence number": 246748, "Fwd thread id": 1, "Ev Idx": 167 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773641.949, "dur": 48.677, "args": { "External id": 17577,"Sequence number": 246748, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 168 } }, { "ph": "f", "id": 20, "pid": 1336754, "tid": 1381179, "ts": 1295650773641.949, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650773643.887, "dur": 46.467, "args": { "External id": 17578,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650773647.626, "dur": 17.310, "args": { "External id": 17579,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650773648.726, "dur": 2.234, "args": { "External id": 17580,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650773651.580, "dur": 13.112, "args": { "External id": 17581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650773652.163, "dur": 12.173, "args": { "External id": 17582,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650773665.862, "dur": 6.676, "args": { "External id": 17583,"Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773669.847, "dur": 2.175, "args": { "External id": 17584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650773673.171, "dur": 16.673, "args": { "External id": 17585,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773696.944, "dur": 87.689, "args": { "External id": 17586,"Record function id": 0, "Sequence number": 246747, "Fwd thread id": 1, "Ev Idx": 177 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773697.987, "dur": 84.010, "args": { "External id": 17587,"Sequence number": 246747, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 178 } }, { "ph": "f", "id": 21, "pid": 1336754, "tid": 1381179, "ts": 1295650773697.987, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650773699.643, "dur": 82.006, "args": { "External id": 17588,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650773700.848, "dur": 17.778, "args": { "External id": 17589,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650773703.610, "dur": 1.973, "args": { "External id": 17590,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650773706.161, "dur": 12.205, "args": { "External id": 17591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650773706.877, "dur": 11.086, "args": { "External id": 17592,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650773719.346, "dur": 2.280, "args": { "External id": 17593,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773720.902, "dur": 0.557, "args": { "External id": 17594,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650773722.295, "dur": 58.706, "args": { "External id": 17595,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 186 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773788.646, "dur": 98.141, "args": { "External id": 17596,"Record function id": 0, "Sequence number": 246746, "Fwd thread id": 1, "Ev Idx": 187 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773789.474, "dur": 79.554, "args": { "External id": 17597,"Sequence number": 246746, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 188 } }, { "ph": "f", "id": 22, "pid": 1336754, "tid": 1381179, "ts": 1295650773789.474, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650773793.570, "dur": 75.147, "args": { "External id": 17598,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650773794.603, "dur": 17.180, "args": { "External id": 17599,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650773797.589, "dur": 1.696, "args": { "External id": 17600,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650773799.783, "dur": 11.749, "args": { "External id": 17601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650773800.935, "dur": 10.290, "args": { "External id": 17602,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650773812.605, "dur": 2.354, "args": { "External id": 17603,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773814.375, "dur": 0.412, "args": { "External id": 17604,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650773815.625, "dur": 52.538, "args": { "External id": 17605,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650773872.466, "dur": 13.192, "args": { "External id": 17606,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 197 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773891.062, "dur": 29.145, "args": { "External id": 17607,"Record function id": 0, "Sequence number": 246745, "Fwd thread id": 1, "Ev Idx": 198 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650773892.186, "dur": 1.107, "args": { "External id": 17608,"Sequence number": 246745, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 199 } }, { "ph": "f", "id": 23, "pid": 1336754, "tid": 1381179, "ts": 1295650773892.186, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650773894.849, "dur": 21.688, "args": { "External id": 17609,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650773896.724, "dur": 19.356, "args": { "External id": 17610,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[1], [], [], []], "Ev Idx": 201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773901.042, "dur": 0.365, "args": { "External id": 17611,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 202 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650773924.390, "dur": 3154.876, "args": { "External id": 17612,"Record function id": 0, "Sequence number": 246744, "Fwd thread id": 1, "Ev Idx": 203 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650773934.592, "dur": 3114.232, "args": { "External id": 17613,"Sequence number": 246744, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 204 } }, { "ph": "f", "id": 24, "pid": 1336754, "tid": 1381179, "ts": 1295650773934.592, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650773960.852, "dur": 1.803, "args": { "External id": 17614,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650773964.632, "dur": 2980.639, "args": { "External id": 17615,"Record function id": 0, "Concrete Inputs": ["", "", "6", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650773965.986, "dur": 2978.892, "args": { "External id": 17616,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650773968.609, "dur": 2.695, "args": { "External id": 17617,"Record function id": 0, "Concrete Inputs": ["[]", "[]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650773972.118, "dur": 2971.908, "args": { "External id": 17618,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::lift_fresh", "pid": 1336754, "tid": 1381179, "ts": 1295650776948.582, "dur": 0.282, "args": { "External id": 17619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650776949.806, "dur": 2.250, "args": { "External id": 17620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 211 } }, { "ph": "X", "cat": "cpu_op", "name": "detach_", "pid": 1336754, "tid": 1381179, "ts": 1295650776951.064, "dur": 0.847, "args": { "External id": 17621,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1381179, "ts": 1295650776955.243, "dur": 21.881, "args": { "External id": 17622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1381179, "ts": 1295650777002.701, "dur": 38.883, "args": { "External id": 17623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1381179, "ts": 1295650777003.937, "dur": 37.472, "args": { "External id": 17624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1381179, "ts": 1295650777005.414, "dur": 35.369, "args": { "External id": 17625,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650777058.392, "dur": 16.942, "args": { "External id": 17626,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650777090.248, "dur": 12.097, "args": { "External id": 17627,"Record function id": 0, "Ev Idx": 218 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650777093.239, "dur": 7.690, "args": { "External id": 17628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650777096.237, "dur": 3.829, "args": { "External id": 17629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 220 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650777097.217, "dur": 2.751, "args": { "External id": 17630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 221 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777105.646, "dur": 9.863, "args": { "External id": 17631,"Record function id": 0, "Sequence number": 246743, "Fwd thread id": 1, "Ev Idx": 222 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777106.710, "dur": 6.938, "args": { "External id": 17632,"Sequence number": 246743, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 223 } }, { "ph": "f", "id": 25, "pid": 1336754, "tid": 1381179, "ts": 1295650777106.710, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650777109.255, "dur": 4.192, "args": { "External id": 17633,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650777111.009, "dur": 2.332, "args": { "External id": 17634,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 225 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777118.752, "dur": 62.858, "args": { "External id": 17635,"Record function id": 0, "Sequence number": 246742, "Fwd thread id": 1, "Ev Idx": 226 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777121.949, "dur": 55.534, "args": { "External id": 17636,"Sequence number": 246742, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 227 } }, { "ph": "f", "id": 26, "pid": 1336754, "tid": 1381179, "ts": 1295650777121.949, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650777124.047, "dur": 53.098, "args": { "External id": 17637,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650777126.408, "dur": 21.162, "args": { "External id": 17638,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650777128.003, "dur": 2.729, "args": { "External id": 17639,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650777131.572, "dur": 15.734, "args": { "External id": 17640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650777132.932, "dur": 13.895, "args": { "External id": 17641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650777148.955, "dur": 4.008, "args": { "External id": 17642,"Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777151.968, "dur": 0.739, "args": { "External id": 17643,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[8388608, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650777153.854, "dur": 22.561, "args": { "External id": 17644,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 235 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777187.383, "dur": 64.408, "args": { "External id": 17645,"Record function id": 0, "Sequence number": 246741, "Fwd thread id": 1, "Ev Idx": 236 } }, { "ph": "X", "cat": "cpu_op", "name": "SelectBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777188.417, "dur": 60.129, "args": { "External id": 17646,"Sequence number": 246741, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 237 } }, { "ph": "f", "id": 27, "pid": 1336754, "tid": 1381179, "ts": 1295650777188.417, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650777190.319, "dur": 57.919, "args": { "External id": 17647,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "2", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650777194.283, "dur": 19.269, "args": { "External id": 17648,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650777195.609, "dur": 2.401, "args": { "External id": 17649,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650777198.885, "dur": 14.435, "args": { "External id": 17650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650777199.704, "dur": 13.247, "args": { "External id": 17651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650777214.795, "dur": 5.681, "args": { "External id": 17652,"Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777219.269, "dur": 0.768, "args": { "External id": 17653,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650777221.295, "dur": 26.153, "args": { "External id": 17654,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 245 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777257.502, "dur": 102.929, "args": { "External id": 17655,"Record function id": 0, "Sequence number": 246740, "Fwd thread id": 1, "Ev Idx": 246 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777258.786, "dur": 98.851, "args": { "External id": 17656,"Sequence number": 246740, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 247 } }, { "ph": "f", "id": 28, "pid": 1336754, "tid": 1381179, "ts": 1295650777258.786, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650777260.806, "dur": 96.358, "args": { "External id": 17657,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650777264.627, "dur": 23.861, "args": { "External id": 17658,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650777268.584, "dur": 2.502, "args": { "External id": 17659,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650777271.856, "dur": 16.358, "args": { "External id": 17660,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650777272.875, "dur": 15.017, "args": { "External id": 17661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650777289.472, "dur": 4.501, "args": { "External id": 17662,"Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777291.304, "dur": 2.388, "args": { "External id": 17663,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650777294.617, "dur": 61.852, "args": { "External id": 17664,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 255 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777364.527, "dur": 101.011, "args": { "External id": 17665,"Record function id": 0, "Sequence number": 246739, "Fwd thread id": 1, "Ev Idx": 256 } }, { "ph": "X", "cat": "cpu_op", "name": "SliceBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777365.741, "dur": 81.137, "args": { "External id": 17666,"Sequence number": 246739, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 257 } }, { "ph": "f", "id": 29, "pid": 1336754, "tid": 1381179, "ts": 1295650777365.741, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650777367.531, "dur": 78.994, "args": { "External id": 17667,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], [], []], "Ev Idx": 258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1381179, "ts": 1295650777368.502, "dur": 23.235, "args": { "External id": 17668,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650777371.424, "dur": 1.921, "args": { "External id": 17669,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 4, 2048]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1381179, "ts": 1295650777377.499, "dur": 13.922, "args": { "External id": 17670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1381179, "ts": 1295650777379.377, "dur": 11.701, "args": { "External id": 17671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], []], "Ev Idx": 262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650777392.492, "dur": 4.788, "args": { "External id": 17672,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777396.565, "dur": 0.574, "args": { "External id": 17673,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650777398.110, "dur": 47.910, "args": { "External id": 17674,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650777450.656, "dur": 13.310, "args": { "External id": 17675,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [33554432, 8192, 2048, 1], []], "Input Dims": [[16, 4096, 4, 2048], [16, 4096, 4, 2048], []], "Ev Idx": 266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650777471.322, "dur": 330.598, "args": { "External id": 17676,"Record function id": 0, "Sequence number": 246738, "Fwd thread id": 1, "Ev Idx": 267 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650777473.226, "dur": 321.110, "args": { "External id": 17677,"Sequence number": 246738, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 268 } }, { "ph": "f", "id": 30, "pid": 1336754, "tid": 1381179, "ts": 1295650777473.226, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295650777632.514, "dur": 40.596, "args": { "External id": 17678,"kernel_hash": "cf7hg2ixt4i43dnksudd5khnoxtnhj2eb5bah2yjl2diidj4xwne", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "262144", "2048", "1", "1986", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/f7/cf7hg2ixt4i43dnksudd5khnoxtnhj2eb5bah2yjl2diidj4xwne.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [2048], [262144, 2048], [262144, 2048], [132, 2048], [262144], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 269 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_0", "pid": 1336754, "tid": 1381179, "ts": 1295650777704.517, "dur": 27.917, "args": { "External id": 17679,"kernel_hash": "c3qhxfu5zrkzpf2jybafupdlrhzermxghmhj46kd4kjqpnskd7hf", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/3q/c3qhxfu5zrkzpf2jybafupdlrhzermxghmhj46kd4kjqpnskd7hf.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 270 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_1", "pid": 1336754, "tid": 1381179, "ts": 1295650777750.938, "dur": 21.233, "args": { "External id": 17680,"kernel_hash": "chmktjza3gzdueqxxvt7hlbkykb7cdfv7coarxbxb3ldjxl472md", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/hm/chmktjza3gzdueqxxvt7hlbkykb7cdfv7coarxbxb3ldjxl472md.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 271 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650777810.138, "dur": 12.554, "args": { "External id": 17681,"Record function id": 0, "Ev Idx": 272 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650777812.641, "dur": 9.153, "args": { "External id": 17682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650777815.870, "dur": 5.113, "args": { "External id": 17683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 274 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650777818.027, "dur": 2.857, "args": { "External id": 17684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 275 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: StackBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777828.952, "dur": 32.750, "args": { "External id": 17685,"Record function id": 0, "Sequence number": 246737, "Fwd thread id": 1, "Ev Idx": 276 } }, { "ph": "X", "cat": "cpu_op", "name": "StackBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777829.922, "dur": 24.237, "args": { "External id": 17686,"Sequence number": 246737, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 2048, 1]], "Input Dims": [[16, 4096, 4, 2048]], "Ev Idx": 277 } }, { "ph": "f", "id": 31, "pid": 1336754, "tid": 1381179, "ts": 1295650777829.922, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650777831.869, "dur": 8.433, "args": { "External id": 17687,"Record function id": 0, "Concrete Inputs": ["", "-2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777837.418, "dur": 0.928, "args": { "External id": 17688,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650777840.992, "dur": 4.767, "args": { "External id": 17689,"Record function id": 0, "Concrete Inputs": ["", "-2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777843.939, "dur": 0.723, "args": { "External id": 17690,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650777846.145, "dur": 3.524, "args": { "External id": 17691,"Record function id": 0, "Concrete Inputs": ["", "-2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777848.072, "dur": 0.292, "args": { "External id": 17692,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1381179, "ts": 1295650777850.247, "dur": 3.242, "args": { "External id": 17693,"Record function id": 0, "Concrete Inputs": ["", "-2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777852.019, "dur": 0.519, "args": { "External id": 17694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 285 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777865.763, "dur": 5.546, "args": { "External id": 17695,"Record function id": 0, "Sequence number": 246736, "Fwd thread id": 1, "Ev Idx": 286 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650777866.860, "dur": 1.049, "args": { "External id": 17696,"Sequence number": 246736, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 287 } }, { "ph": "f", "id": 32, "pid": 1336754, "tid": 1381179, "ts": 1295650777866.860, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650777875.578, "dur": 578.513, "args": { "External id": 17697,"Record function id": 0, "Sequence number": 246735, "Fwd thread id": 1, "Ev Idx": 288 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650777877.195, "dur": 563.371, "args": { "External id": 17698,"Sequence number": 246735, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 289 } }, { "ph": "f", "id": 33, "pid": 1336754, "tid": 1381179, "ts": 1295650777877.195, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650777913.986, "dur": 9.395, "args": { "External id": 17699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650777919.298, "dur": 3.786, "args": { "External id": 17700,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650777927.306, "dur": 8.207, "args": { "External id": 17701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650777929.715, "dur": 4.867, "args": { "External id": 17702,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777933.588, "dur": 0.753, "args": { "External id": 17703,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1381179, "ts": 1295650777939.281, "dur": 164.327, "args": { "External id": 17704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650777940.337, "dur": 5.720, "args": { "External id": 17705,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650777941.161, "dur": 3.770, "args": { "External id": 17706,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650777942.909, "dur": 1.882, "args": { "External id": 17707,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1381179, "ts": 1295650777947.495, "dur": 155.188, "args": { "External id": 17708,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650777951.461, "dur": 149.557, "args": { "External id": 17709,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650778111.780, "dur": 5.079, "args": { "External id": 17710,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778113.826, "dur": 2.918, "args": { "External id": 17711,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650778153.922, "dur": 6.026, "args": { "External id": 17712,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650778161.341, "dur": 3.787, "args": { "External id": 17713,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650778166.334, "dur": 1.473, "args": { "External id": 17714,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778207.851, "dur": 2.900, "args": { "External id": 17715,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778208.951, "dur": 1.650, "args": { "External id": 17716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336754, "tid": 1381179, "ts": 1295650778252.172, "dur": 167.666, "args": { "External id": 17717,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650778259.146, "dur": 9.966, "args": { "External id": 17718,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778263.869, "dur": 1.372, "args": { "External id": 17719,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650778271.766, "dur": 10.142, "args": { "External id": 17720,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778278.628, "dur": 2.525, "args": { "External id": 17721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650778283.839, "dur": 2.875, "args": { "External id": 17722,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778285.908, "dur": 0.409, "args": { "External id": 17723,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650778287.843, "dur": 3.025, "args": { "External id": 17724,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778289.732, "dur": 0.577, "args": { "External id": 17725,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650778297.354, "dur": 3.313, "args": { "External id": 17726,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778299.853, "dur": 0.478, "args": { "External id": 17727,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778301.973, "dur": 7.407, "args": { "External id": 17728,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650778306.786, "dur": 2.412, "args": { "External id": 17729,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650778310.703, "dur": 3.044, "args": { "External id": 17730,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778313.028, "dur": 0.432, "args": { "External id": 17731,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778314.697, "dur": 3.119, "args": { "External id": 17732,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778316.306, "dur": 1.416, "args": { "External id": 17733,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650778319.846, "dur": 83.552, "args": { "External id": 17734,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778407.628, "dur": 2.628, "args": { "External id": 17735,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650778411.469, "dur": 3.848, "args": { "External id": 17736,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778413.840, "dur": 0.854, "args": { "External id": 17737,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778417.490, "dur": 1.195, "args": { "External id": 17738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778468.518, "dur": 11.009, "args": { "External id": 17739,"Record function id": 0, "Ev Idx": 330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778471.216, "dur": 7.523, "args": { "External id": 17740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778474.131, "dur": 3.606, "args": { "External id": 17741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778475.359, "dur": 2.270, "args": { "External id": 17742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778483.628, "dur": 10.760, "args": { "External id": 17743,"Record function id": 0, "Sequence number": 246734, "Fwd thread id": 1, "Ev Idx": 334 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778485.509, "dur": 6.092, "args": { "External id": 17744,"Sequence number": 246734, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 335 } }, { "ph": "f", "id": 34, "pid": 1336754, "tid": 1381179, "ts": 1295650778485.509, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778487.310, "dur": 4.080, "args": { "External id": 17745,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778490.459, "dur": 0.792, "args": { "External id": 17746,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778498.160, "dur": 173.261, "args": { "External id": 17747,"Record function id": 0, "Sequence number": 246733, "Fwd thread id": 1, "Ev Idx": 338 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778498.949, "dur": 165.694, "args": { "External id": 17748,"Sequence number": 246733, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 339 } }, { "ph": "f", "id": 35, "pid": 1336754, "tid": 1381179, "ts": 1295650778498.949, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778502.604, "dur": 4.801, "args": { "External id": 17749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778504.093, "dur": 2.641, "args": { "External id": 17750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778505.854, "dur": 0.723, "args": { "External id": 17751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650778508.560, "dur": 62.883, "args": { "External id": 17752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778574.725, "dur": 4.252, "args": { "External id": 17753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778575.454, "dur": 2.857, "args": { "External id": 17754,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778577.050, "dur": 1.088, "args": { "External id": 17755,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778580.201, "dur": 4.205, "args": { "External id": 17756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778580.914, "dur": 2.812, "args": { "External id": 17757,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778583.126, "dur": 0.539, "args": { "External id": 17758,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650778587.011, "dur": 76.949, "args": { "External id": 17759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778676.083, "dur": 7.068, "args": { "External id": 17760,"Record function id": 0, "Sequence number": 246732, "Fwd thread id": 1, "Ev Idx": 351 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778677.205, "dur": 4.140, "args": { "External id": 17761,"Sequence number": 246732, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 352 } }, { "ph": "f", "id": 36, "pid": 1336754, "tid": 1381179, "ts": 1295650778677.205, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778679.075, "dur": 2.132, "args": { "External id": 17762,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778679.946, "dur": 1.130, "args": { "External id": 17763,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 354 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778686.783, "dur": 10.360, "args": { "External id": 17764,"Record function id": 0, "Sequence number": 246731, "Fwd thread id": 1, "Ev Idx": 355 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778687.665, "dur": 6.950, "args": { "External id": 17765,"Sequence number": 246731, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 356 } }, { "ph": "f", "id": 37, "pid": 1336754, "tid": 1381179, "ts": 1295650778687.665, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778688.551, "dur": 5.870, "args": { "External id": 17766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778689.358, "dur": 4.533, "args": { "External id": 17767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778693.206, "dur": 0.584, "args": { "External id": 17768,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 359 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778701.249, "dur": 5.262, "args": { "External id": 17769,"Record function id": 0, "Ev Idx": 360 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778703.065, "dur": 2.986, "args": { "External id": 17770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778704.116, "dur": 1.655, "args": { "External id": 17771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 362 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778704.509, "dur": 1.097, "args": { "External id": 17772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778709.926, "dur": 6.471, "args": { "External id": 17773,"Record function id": 0, "Sequence number": 246730, "Fwd thread id": 1, "Ev Idx": 364 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778711.130, "dur": 2.632, "args": { "External id": 17774,"Sequence number": 246730, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 365 } }, { "ph": "f", "id": 38, "pid": 1336754, "tid": 1381179, "ts": 1295650778711.130, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778712.170, "dur": 1.446, "args": { "External id": 17775,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778712.864, "dur": 0.626, "args": { "External id": 17776,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 367 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778719.730, "dur": 152.305, "args": { "External id": 17777,"Record function id": 0, "Sequence number": 246729, "Fwd thread id": 1, "Ev Idx": 368 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778720.640, "dur": 144.300, "args": { "External id": 17778,"Sequence number": 246729, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 369 } }, { "ph": "f", "id": 39, "pid": 1336754, "tid": 1381179, "ts": 1295650778720.640, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778724.916, "dur": 3.354, "args": { "External id": 17779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778725.489, "dur": 2.342, "args": { "External id": 17780,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778727.163, "dur": 0.528, "args": { "External id": 17781,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650778728.982, "dur": 48.145, "args": { "External id": 17782,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778778.087, "dur": 5.725, "args": { "External id": 17783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778778.804, "dur": 4.480, "args": { "External id": 17784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778782.240, "dur": 0.921, "args": { "External id": 17785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778784.837, "dur": 4.727, "args": { "External id": 17786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778785.526, "dur": 3.571, "args": { "External id": 17787,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778787.324, "dur": 1.697, "args": { "External id": 17788,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650778789.995, "dur": 74.297, "args": { "External id": 17789,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778878.722, "dur": 35.679, "args": { "External id": 17790,"Record function id": 0, "Sequence number": 246728, "Fwd thread id": 1, "Ev Idx": 381 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778879.854, "dur": 4.375, "args": { "External id": 17791,"Sequence number": 246728, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 382 } }, { "ph": "f", "id": 40, "pid": 1336754, "tid": 1381179, "ts": 1295650778879.854, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650778881.366, "dur": 2.733, "args": { "External id": 17792,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650778882.792, "dur": 1.206, "args": { "External id": 17793,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650778887.466, "dur": 24.489, "args": { "External id": 17794,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 385 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778920.339, "dur": 8.427, "args": { "External id": 17795,"Record function id": 0, "Sequence number": 246727, "Fwd thread id": 1, "Ev Idx": 386 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650778921.342, "dur": 5.247, "args": { "External id": 17796,"Sequence number": 246727, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 387 } }, { "ph": "f", "id": 41, "pid": 1336754, "tid": 1381179, "ts": 1295650778921.342, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650778922.426, "dur": 3.940, "args": { "External id": 17797,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650778923.485, "dur": 2.325, "args": { "External id": 17798,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650778925.198, "dur": 0.495, "args": { "External id": 17799,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 390 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778933.019, "dur": 5.144, "args": { "External id": 17800,"Record function id": 0, "Ev Idx": 391 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650778934.795, "dur": 2.903, "args": { "External id": 17801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778935.768, "dur": 1.650, "args": { "External id": 17802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 393 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650778936.429, "dur": 0.852, "args": { "External id": 17803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 394 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650778942.511, "dur": 502.911, "args": { "External id": 17804,"Record function id": 0, "Sequence number": 246726, "Fwd thread id": 1, "Ev Idx": 395 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650778944.483, "dur": 486.616, "args": { "External id": 17805,"Sequence number": 246726, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 396 } }, { "ph": "f", "id": 42, "pid": 1336754, "tid": 1381179, "ts": 1295650778944.483, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1381179, "ts": 1295650778968.002, "dur": 91.633, "args": { "External id": 17806,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650778969.589, "dur": 89.757, "args": { "External id": 17807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650778972.519, "dur": 7.883, "args": { "External id": 17808,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650778976.971, "dur": 2.900, "args": { "External id": 17809,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650779030.108, "dur": 28.573, "args": { "External id": 17810,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779074.135, "dur": 3.268, "args": { "External id": 17811,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779075.146, "dur": 2.159, "args": { "External id": 17812,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779081.795, "dur": 6.340, "args": { "External id": 17813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779085.297, "dur": 2.745, "args": { "External id": 17814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650779101.462, "dur": 2.951, "args": { "External id": 17815,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650779115.827, "dur": 3.265, "args": { "External id": 17816,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779312.454, "dur": 3.504, "args": { "External id": 17817,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650779320.776, "dur": 36.492, "args": { "External id": 17818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779331.886, "dur": 0.915, "args": { "External id": 17819,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650779362.724, "dur": 31.925, "args": { "External id": 17820,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650779364.705, "dur": 29.742, "args": { "External id": 17821,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779371.561, "dur": 3.563, "args": { "External id": 17822,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650779376.200, "dur": 17.858, "args": { "External id": 17823,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650779399.267, "dur": 2.965, "args": { "External id": 17824,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779400.832, "dur": 1.267, "args": { "External id": 17825,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779409.449, "dur": 2.903, "args": { "External id": 17826,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779410.722, "dur": 1.499, "args": { "External id": 17827,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779417.259, "dur": 4.223, "args": { "External id": 17828,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779418.747, "dur": 2.648, "args": { "External id": 17829,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 420 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650779459.959, "dur": 9.277, "args": { "External id": 17830,"Record function id": 0, "Ev Idx": 421 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650779462.528, "dur": 6.020, "args": { "External id": 17831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650779464.768, "dur": 2.987, "args": { "External id": 17832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 423 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650779465.572, "dur": 2.076, "args": { "External id": 17833,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 424 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779473.119, "dur": 10.100, "args": { "External id": 17834,"Record function id": 0, "Sequence number": 246725, "Fwd thread id": 1, "Ev Idx": 425 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779474.674, "dur": 6.409, "args": { "External id": 17835,"Sequence number": 246725, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 426 } }, { "ph": "f", "id": 43, "pid": 1336754, "tid": 1381179, "ts": 1295650779474.674, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779478.599, "dur": 2.262, "args": { "External id": 17836,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779479.617, "dur": 1.076, "args": { "External id": 17837,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 428 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779486.535, "dur": 142.497, "args": { "External id": 17838,"Record function id": 0, "Sequence number": 246724, "Fwd thread id": 1, "Ev Idx": 429 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779487.437, "dur": 137.849, "args": { "External id": 17839,"Sequence number": 246724, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 430 } }, { "ph": "f", "id": 44, "pid": 1336754, "tid": 1381179, "ts": 1295650779487.437, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650779490.317, "dur": 7.167, "args": { "External id": 17840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650779491.891, "dur": 4.929, "args": { "External id": 17841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779495.934, "dur": 0.645, "args": { "External id": 17842,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650779498.432, "dur": 62.821, "args": { "External id": 17843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650779562.361, "dur": 5.267, "args": { "External id": 17844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650779563.112, "dur": 3.883, "args": { "External id": 17845,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779564.935, "dur": 1.881, "args": { "External id": 17846,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650779569.052, "dur": 4.994, "args": { "External id": 17847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650779569.890, "dur": 3.685, "args": { "External id": 17848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779572.872, "dur": 0.597, "args": { "External id": 17849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650779574.626, "dur": 49.847, "args": { "External id": 17850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 441 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779633.769, "dur": 8.147, "args": { "External id": 17851,"Record function id": 0, "Sequence number": 246723, "Fwd thread id": 1, "Ev Idx": 442 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779634.731, "dur": 5.246, "args": { "External id": 17852,"Sequence number": 246723, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 443 } }, { "ph": "f", "id": 45, "pid": 1336754, "tid": 1381179, "ts": 1295650779634.731, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779636.322, "dur": 3.483, "args": { "External id": 17853,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779637.453, "dur": 2.221, "args": { "External id": 17854,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 445 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779645.701, "dur": 9.396, "args": { "External id": 17855,"Record function id": 0, "Sequence number": 246722, "Fwd thread id": 1, "Ev Idx": 446 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779646.905, "dur": 6.008, "args": { "External id": 17856,"Sequence number": 246722, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 447 } }, { "ph": "f", "id": 46, "pid": 1336754, "tid": 1381179, "ts": 1295650779646.905, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650779647.577, "dur": 5.125, "args": { "External id": 17857,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650779648.291, "dur": 3.928, "args": { "External id": 17858,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779651.746, "dur": 0.358, "args": { "External id": 17859,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650779659.284, "dur": 5.786, "args": { "External id": 17860,"Record function id": 0, "Ev Idx": 451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650779660.747, "dur": 3.873, "args": { "External id": 17861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650779661.920, "dur": 2.464, "args": { "External id": 17862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650779662.930, "dur": 1.375, "args": { "External id": 17863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779668.164, "dur": 6.871, "args": { "External id": 17864,"Record function id": 0, "Sequence number": 246721, "Fwd thread id": 1, "Ev Idx": 455 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650779669.223, "dur": 4.055, "args": { "External id": 17865,"Sequence number": 246721, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 456 } }, { "ph": "f", "id": 47, "pid": 1336754, "tid": 1381179, "ts": 1295650779669.223, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650779670.680, "dur": 2.456, "args": { "External id": 17866,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650779671.936, "dur": 1.073, "args": { "External id": 17867,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650779679.782, "dur": 300.417, "args": { "External id": 17868,"Record function id": 0, "Sequence number": 246720, "Fwd thread id": 1, "Ev Idx": 459 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650779681.500, "dur": 283.371, "args": { "External id": 17869,"Sequence number": 246720, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 460 } }, { "ph": "f", "id": 48, "pid": 1336754, "tid": 1381179, "ts": 1295650779681.500, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650779696.435, "dur": 6.209, "args": { "External id": 17870,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779698.958, "dur": 3.176, "args": { "External id": 17871,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650779704.906, "dur": 3.687, "args": { "External id": 17872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779706.928, "dur": 1.460, "args": { "External id": 17873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650779710.426, "dur": 6.006, "args": { "External id": 17874,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650779713.167, "dur": 3.086, "args": { "External id": 17875,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 466 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650779749.324, "dur": 190.558, "args": { "External id": 17876,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650779836.479, "dur": 2.978, "args": { "External id": 17877,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650779841.391, "dur": 3.195, "args": { "External id": 17878,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650779952.059, "dur": 3.463, "args": { "External id": 17879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650779958.660, "dur": 0.940, "args": { "External id": 17880,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650779961.528, "dur": 0.956, "args": { "External id": 17881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650780027.329, "dur": 256.484, "args": { "External id": 17882,"Record function id": 0, "Sequence number": 246719, "Fwd thread id": 1, "Ev Idx": 473 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650780030.119, "dur": 245.126, "args": { "External id": 17883,"Sequence number": 246719, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 474 } }, { "ph": "f", "id": 49, "pid": 1336754, "tid": 1381179, "ts": 1295650780030.119, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650780052.968, "dur": 52.124, "args": { "External id": 17884,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780056.641, "dur": 4.417, "args": { "External id": 17885,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650780062.549, "dur": 41.829, "args": { "External id": 17886,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650780115.413, "dur": 5.482, "args": { "External id": 17887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780117.878, "dur": 2.655, "args": { "External id": 17888,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 479 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650780293.166, "dur": 162.426, "args": { "External id": 17889,"Record function id": 0, "Sequence number": 246718, "Fwd thread id": 1, "Ev Idx": 480 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650780295.195, "dur": 154.944, "args": { "External id": 17890,"Sequence number": 246718, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 481 } }, { "ph": "f", "id": 50, "pid": 1336754, "tid": 1381179, "ts": 1295650780295.195, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650780309.250, "dur": 35.726, "args": { "External id": 17891,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780312.142, "dur": 3.519, "args": { "External id": 17892,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650780316.557, "dur": 27.964, "args": { "External id": 17893,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650780353.048, "dur": 4.590, "args": { "External id": 17894,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780355.219, "dur": 2.104, "args": { "External id": 17895,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780461.350, "dur": 15.402, "args": { "External id": 17896,"Record function id": 0, "Sequence number": 246717, "Fwd thread id": 1, "Ev Idx": 487 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780462.743, "dur": 11.577, "args": { "External id": 17897,"Sequence number": 246717, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 488 } }, { "ph": "f", "id": 51, "pid": 1336754, "tid": 1381179, "ts": 1295650780462.743, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780465.518, "dur": 8.572, "args": { "External id": 17898,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780467.418, "dur": 6.443, "args": { "External id": 17899,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 490 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780480.432, "dur": 8.720, "args": { "External id": 17900,"Record function id": 0, "Sequence number": 246716, "Fwd thread id": 1, "Ev Idx": 491 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780481.477, "dur": 5.646, "args": { "External id": 17901,"Sequence number": 246716, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 492 } }, { "ph": "f", "id": 52, "pid": 1336754, "tid": 1381179, "ts": 1295650780481.477, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780482.980, "dur": 4.000, "args": { "External id": 17902,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780486.009, "dur": 0.814, "args": { "External id": 17903,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 494 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780492.310, "dur": 7.423, "args": { "External id": 17904,"Record function id": 0, "Sequence number": 246715, "Fwd thread id": 1, "Ev Idx": 495 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780493.257, "dur": 4.638, "args": { "External id": 17905,"Sequence number": 246715, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 496 } }, { "ph": "f", "id": 53, "pid": 1336754, "tid": 1381179, "ts": 1295650780493.257, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780494.837, "dur": 2.897, "args": { "External id": 17906,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780496.967, "dur": 0.676, "args": { "External id": 17907,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 498 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780503.336, "dur": 6.728, "args": { "External id": 17908,"Record function id": 0, "Sequence number": 246714, "Fwd thread id": 1, "Ev Idx": 499 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780504.466, "dur": 3.567, "args": { "External id": 17909,"Sequence number": 246714, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 500 } }, { "ph": "f", "id": 54, "pid": 1336754, "tid": 1381179, "ts": 1295650780504.466, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780505.828, "dur": 2.056, "args": { "External id": 17910,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780506.862, "dur": 0.919, "args": { "External id": 17911,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 502 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780513.356, "dur": 174.387, "args": { "External id": 17912,"Record function id": 0, "Sequence number": 246713, "Fwd thread id": 1, "Ev Idx": 503 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780516.484, "dur": 164.674, "args": { "External id": 17913,"Sequence number": 246713, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 504 } }, { "ph": "f", "id": 55, "pid": 1336754, "tid": 1381179, "ts": 1295650780516.484, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780520.240, "dur": 6.898, "args": { "External id": 17914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780521.860, "dur": 4.700, "args": { "External id": 17915,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780524.622, "dur": 1.713, "args": { "External id": 17916,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780528.844, "dur": 68.589, "args": { "External id": 17917,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780599.186, "dur": 6.630, "args": { "External id": 17918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780600.190, "dur": 4.848, "args": { "External id": 17919,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780604.138, "dur": 0.740, "args": { "External id": 17920,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780629.102, "dur": 3.274, "args": { "External id": 17921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780629.978, "dur": 1.877, "args": { "External id": 17922,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780631.397, "dur": 0.366, "args": { "External id": 17923,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780632.975, "dur": 47.291, "args": { "External id": 17924,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780692.497, "dur": 8.431, "args": { "External id": 17925,"Record function id": 0, "Sequence number": 246712, "Fwd thread id": 1, "Ev Idx": 516 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780693.385, "dur": 5.769, "args": { "External id": 17926,"Sequence number": 246712, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 517 } }, { "ph": "f", "id": 56, "pid": 1336754, "tid": 1381179, "ts": 1295650780693.385, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780694.924, "dur": 4.031, "args": { "External id": 17927,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780697.821, "dur": 1.016, "args": { "External id": 17928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 519 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780704.177, "dur": 7.382, "args": { "External id": 17929,"Record function id": 0, "Sequence number": 246711, "Fwd thread id": 1, "Ev Idx": 520 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780705.037, "dur": 3.948, "args": { "External id": 17930,"Sequence number": 246711, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 521 } }, { "ph": "f", "id": 57, "pid": 1336754, "tid": 1381179, "ts": 1295650780705.037, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780705.648, "dur": 3.120, "args": { "External id": 17931,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780706.213, "dur": 2.027, "args": { "External id": 17932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780707.732, "dur": 0.404, "args": { "External id": 17933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 524 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650780717.597, "dur": 11.929, "args": { "External id": 17934,"Record function id": 0, "Ev Idx": 525 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650780719.851, "dur": 8.817, "args": { "External id": 17935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650780722.100, "dur": 6.192, "args": { "External id": 17936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 527 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650780725.385, "dur": 2.610, "args": { "External id": 17937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 528 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780735.537, "dur": 6.090, "args": { "External id": 17938,"Record function id": 0, "Sequence number": 246710, "Fwd thread id": 1, "Ev Idx": 529 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780736.914, "dur": 2.656, "args": { "External id": 17939,"Sequence number": 246710, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 530 } }, { "ph": "f", "id": 58, "pid": 1336754, "tid": 1381179, "ts": 1295650780736.914, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780738.054, "dur": 1.370, "args": { "External id": 17940,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780738.659, "dur": 0.671, "args": { "External id": 17941,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 532 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780744.856, "dur": 86.176, "args": { "External id": 17942,"Record function id": 0, "Sequence number": 246709, "Fwd thread id": 1, "Ev Idx": 533 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780745.484, "dur": 80.715, "args": { "External id": 17943,"Sequence number": 246709, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 534 } }, { "ph": "f", "id": 59, "pid": 1336754, "tid": 1381179, "ts": 1295650780745.484, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780747.482, "dur": 4.473, "args": { "External id": 17944,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780747.894, "dur": 3.610, "args": { "External id": 17945,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780751.037, "dur": 0.365, "args": { "External id": 17946,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780752.772, "dur": 28.326, "args": { "External id": 17947,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780782.144, "dur": 3.548, "args": { "External id": 17948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780782.534, "dur": 2.638, "args": { "External id": 17949,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780784.288, "dur": 0.769, "args": { "External id": 17950,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780786.518, "dur": 6.606, "args": { "External id": 17951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780789.673, "dur": 2.967, "args": { "External id": 17952,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780790.841, "dur": 1.664, "args": { "External id": 17953,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780793.526, "dur": 31.980, "args": { "External id": 17954,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 545 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780835.337, "dur": 32.223, "args": { "External id": 17955,"Record function id": 0, "Sequence number": 246708, "Fwd thread id": 1, "Ev Idx": 546 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780836.173, "dur": 4.158, "args": { "External id": 17956,"Sequence number": 246708, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 547 } }, { "ph": "f", "id": 60, "pid": 1336754, "tid": 1381179, "ts": 1295650780836.173, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780838.101, "dur": 2.103, "args": { "External id": 17957,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780838.970, "dur": 1.107, "args": { "External id": 17958,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650780843.127, "dur": 22.212, "args": { "External id": 17959,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 550 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780871.028, "dur": 9.483, "args": { "External id": 17960,"Record function id": 0, "Sequence number": 246707, "Fwd thread id": 1, "Ev Idx": 551 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780871.962, "dur": 6.524, "args": { "External id": 17961,"Sequence number": 246707, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 552 } }, { "ph": "f", "id": 61, "pid": 1336754, "tid": 1381179, "ts": 1295650780871.962, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780874.692, "dur": 3.563, "args": { "External id": 17962,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780875.420, "dur": 2.298, "args": { "External id": 17963,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780877.176, "dur": 0.435, "args": { "External id": 17964,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 555 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650780884.635, "dur": 5.186, "args": { "External id": 17965,"Record function id": 0, "Ev Idx": 556 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650780886.799, "dur": 2.575, "args": { "External id": 17966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650780887.643, "dur": 1.397, "args": { "External id": 17967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 558 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650780888.289, "dur": 0.652, "args": { "External id": 17968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 559 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780893.140, "dur": 8.278, "args": { "External id": 17969,"Record function id": 0, "Sequence number": 246706, "Fwd thread id": 1, "Ev Idx": 560 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780894.217, "dur": 4.937, "args": { "External id": 17970,"Sequence number": 246706, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 561 } }, { "ph": "f", "id": 62, "pid": 1336754, "tid": 1381179, "ts": 1295650780894.217, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650780895.300, "dur": 3.722, "args": { "External id": 17971,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650780898.087, "dur": 0.833, "args": { "External id": 17972,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 563 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780904.377, "dur": 138.468, "args": { "External id": 17973,"Record function id": 0, "Sequence number": 246705, "Fwd thread id": 1, "Ev Idx": 564 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650780904.980, "dur": 127.998, "args": { "External id": 17974,"Sequence number": 246705, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 565 } }, { "ph": "f", "id": 63, "pid": 1336754, "tid": 1381179, "ts": 1295650780904.980, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780907.168, "dur": 2.605, "args": { "External id": 17975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780907.564, "dur": 1.782, "args": { "External id": 17976,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780908.875, "dur": 0.383, "args": { "External id": 17977,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780910.459, "dur": 28.036, "args": { "External id": 17978,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780941.710, "dur": 3.575, "args": { "External id": 17979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780942.181, "dur": 2.616, "args": { "External id": 17980,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780944.118, "dur": 0.569, "args": { "External id": 17981,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650780946.419, "dur": 2.724, "args": { "External id": 17982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650780946.969, "dur": 1.763, "args": { "External id": 17983,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650780948.317, "dur": 0.348, "args": { "External id": 17984,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650780951.771, "dur": 32.406, "args": { "External id": 17985,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781049.878, "dur": 30.404, "args": { "External id": 17986,"Record function id": 0, "Sequence number": 246704, "Fwd thread id": 1, "Ev Idx": 577 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781051.005, "dur": 4.951, "args": { "External id": 17987,"Sequence number": 246704, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 578 } }, { "ph": "f", "id": 64, "pid": 1336754, "tid": 1381179, "ts": 1295650781051.005, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781053.098, "dur": 2.673, "args": { "External id": 17988,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781054.020, "dur": 1.613, "args": { "External id": 17989,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650781058.766, "dur": 19.482, "args": { "External id": 17990,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 581 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781084.005, "dur": 13.268, "args": { "External id": 17991,"Record function id": 0, "Sequence number": 246703, "Fwd thread id": 1, "Ev Idx": 582 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781084.972, "dur": 10.442, "args": { "External id": 17992,"Sequence number": 246703, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 583 } }, { "ph": "f", "id": 65, "pid": 1336754, "tid": 1381179, "ts": 1295650781084.972, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650781085.817, "dur": 9.379, "args": { "External id": 17993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650781089.638, "dur": 4.978, "args": { "External id": 17994,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781093.886, "dur": 0.608, "args": { "External id": 17995,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 586 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781101.834, "dur": 6.103, "args": { "External id": 17996,"Record function id": 0, "Ev Idx": 587 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781103.609, "dur": 3.780, "args": { "External id": 17997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781104.890, "dur": 2.212, "args": { "External id": 17998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 589 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781105.617, "dur": 1.385, "args": { "External id": 17999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 590 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650781112.585, "dur": 387.841, "args": { "External id": 18000,"Record function id": 0, "Sequence number": 246702, "Fwd thread id": 1, "Ev Idx": 591 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650781114.308, "dur": 350.381, "args": { "External id": 18001,"Sequence number": 246702, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 592 } }, { "ph": "f", "id": 66, "pid": 1336754, "tid": 1381179, "ts": 1295650781114.308, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781146.502, "dur": 2.230, "args": { "External id": 18002,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781147.414, "dur": 1.103, "args": { "External id": 18003,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650781165.674, "dur": 5.779, "args": { "External id": 18004,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650781181.339, "dur": 1.907, "args": { "External id": 18005,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781356.641, "dur": 3.100, "args": { "External id": 18006,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650781364.091, "dur": 37.741, "args": { "External id": 18007,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781374.862, "dur": 0.948, "args": { "External id": 18008,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650781407.571, "dur": 32.106, "args": { "External id": 18009,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650781409.548, "dur": 29.851, "args": { "External id": 18010,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781414.111, "dur": 5.259, "args": { "External id": 18011,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650781421.047, "dur": 17.702, "args": { "External id": 18012,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650781446.403, "dur": 2.497, "args": { "External id": 18013,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781447.552, "dur": 1.254, "args": { "External id": 18014,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781455.186, "dur": 2.549, "args": { "External id": 18015,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781456.813, "dur": 0.822, "args": { "External id": 18016,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650781476.264, "dur": 18.085, "args": { "External id": 18017,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 608 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781513.315, "dur": 11.189, "args": { "External id": 18018,"Record function id": 0, "Ev Idx": 609 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781515.972, "dur": 7.760, "args": { "External id": 18019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781517.720, "dur": 5.178, "args": { "External id": 18020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 611 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781520.962, "dur": 1.783, "args": { "External id": 18021,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 612 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781530.722, "dur": 5.594, "args": { "External id": 18022,"Record function id": 0, "Sequence number": 246701, "Fwd thread id": 1, "Ev Idx": 613 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781532.118, "dur": 1.466, "args": { "External id": 18023,"Sequence number": 246701, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 614 } }, { "ph": "f", "id": 67, "pid": 1336754, "tid": 1381179, "ts": 1295650781532.118, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650781540.317, "dur": 403.278, "args": { "External id": 18024,"Record function id": 0, "Sequence number": 246700, "Fwd thread id": 1, "Ev Idx": 615 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650781541.897, "dur": 391.937, "args": { "External id": 18025,"Sequence number": 246700, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 616 } }, { "ph": "f", "id": 68, "pid": 1336754, "tid": 1381179, "ts": 1295650781541.897, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781569.211, "dur": 8.394, "args": { "External id": 18026,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650781574.485, "dur": 2.856, "args": { "External id": 18027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650781580.833, "dur": 6.695, "args": { "External id": 18028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650781582.268, "dur": 4.587, "args": { "External id": 18029,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781585.941, "dur": 0.734, "args": { "External id": 18030,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1381179, "ts": 1295650781591.131, "dur": 95.705, "args": { "External id": 18031,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650781591.834, "dur": 5.266, "args": { "External id": 18032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650781592.414, "dur": 4.143, "args": { "External id": 18033,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781594.339, "dur": 2.093, "args": { "External id": 18034,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1381179, "ts": 1295650781598.241, "dur": 88.090, "args": { "External id": 18035,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650781601.777, "dur": 83.838, "args": { "External id": 18036,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650781690.045, "dur": 2.872, "args": { "External id": 18037,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781691.277, "dur": 1.488, "args": { "External id": 18038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650781724.171, "dur": 5.057, "args": { "External id": 18039,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650781730.579, "dur": 1.667, "args": { "External id": 18040,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650781733.515, "dur": 1.758, "args": { "External id": 18041,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781770.373, "dur": 2.782, "args": { "External id": 18042,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781771.675, "dur": 1.335, "args": { "External id": 18043,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336754, "tid": 1381179, "ts": 1295650781793.249, "dur": 124.670, "args": { "External id": 18044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650781798.463, "dur": 6.427, "args": { "External id": 18045,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781803.103, "dur": 0.866, "args": { "External id": 18046,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650781806.937, "dur": 7.872, "args": { "External id": 18047,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781811.572, "dur": 2.564, "args": { "External id": 18048,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650781816.048, "dur": 2.822, "args": { "External id": 18049,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781818.160, "dur": 0.361, "args": { "External id": 18050,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650781819.931, "dur": 3.144, "args": { "External id": 18051,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781822.091, "dur": 0.555, "args": { "External id": 18052,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650781828.754, "dur": 2.992, "args": { "External id": 18053,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781830.750, "dur": 0.670, "args": { "External id": 18054,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781833.001, "dur": 5.569, "args": { "External id": 18055,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650781836.554, "dur": 1.850, "args": { "External id": 18056,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650781839.743, "dur": 3.283, "args": { "External id": 18057,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781842.134, "dur": 0.612, "args": { "External id": 18058,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781843.920, "dur": 4.298, "args": { "External id": 18059,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781844.950, "dur": 3.165, "args": { "External id": 18060,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650781849.460, "dur": 52.154, "args": { "External id": 18061,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781905.766, "dur": 3.104, "args": { "External id": 18062,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650781910.134, "dur": 3.385, "args": { "External id": 18063,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650781912.509, "dur": 0.509, "args": { "External id": 18064,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781915.962, "dur": 0.783, "args": { "External id": 18065,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 656 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781952.745, "dur": 8.692, "args": { "External id": 18066,"Record function id": 0, "Ev Idx": 657 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650781955.286, "dur": 5.458, "args": { "External id": 18067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781957.093, "dur": 2.787, "args": { "External id": 18068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 659 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650781958.020, "dur": 1.749, "args": { "External id": 18069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 660 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781965.521, "dur": 9.203, "args": { "External id": 18070,"Record function id": 0, "Sequence number": 246699, "Fwd thread id": 1, "Ev Idx": 661 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781967.280, "dur": 5.412, "args": { "External id": 18071,"Sequence number": 246699, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 662 } }, { "ph": "f", "id": 69, "pid": 1336754, "tid": 1381179, "ts": 1295650781967.280, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650781968.860, "dur": 3.681, "args": { "External id": 18072,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650781971.615, "dur": 0.770, "args": { "External id": 18073,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781978.019, "dur": 176.664, "args": { "External id": 18074,"Record function id": 0, "Sequence number": 246698, "Fwd thread id": 1, "Ev Idx": 665 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650781978.805, "dur": 168.858, "args": { "External id": 18075,"Sequence number": 246698, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 666 } }, { "ph": "f", "id": 70, "pid": 1336754, "tid": 1381179, "ts": 1295650781978.805, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650781981.429, "dur": 45.064, "args": { "External id": 18076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650781982.633, "dur": 42.825, "args": { "External id": 18077,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782023.649, "dur": 1.270, "args": { "External id": 18078,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782028.098, "dur": 51.820, "args": { "External id": 18079,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782083.068, "dur": 5.220, "args": { "External id": 18080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782083.935, "dur": 3.511, "args": { "External id": 18081,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782085.865, "dur": 1.411, "args": { "External id": 18082,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782089.888, "dur": 3.247, "args": { "External id": 18083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782090.681, "dur": 1.972, "args": { "External id": 18084,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782092.119, "dur": 0.472, "args": { "External id": 18085,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782095.844, "dur": 51.021, "args": { "External id": 18086,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 677 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782161.391, "dur": 7.269, "args": { "External id": 18087,"Record function id": 0, "Sequence number": 246697, "Fwd thread id": 1, "Ev Idx": 678 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782162.666, "dur": 4.801, "args": { "External id": 18088,"Sequence number": 246697, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 679 } }, { "ph": "f", "id": 71, "pid": 1336754, "tid": 1381179, "ts": 1295650782162.666, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782164.627, "dur": 2.687, "args": { "External id": 18089,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782165.902, "dur": 1.313, "args": { "External id": 18090,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 681 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782171.974, "dur": 7.716, "args": { "External id": 18091,"Record function id": 0, "Sequence number": 246696, "Fwd thread id": 1, "Ev Idx": 682 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782172.848, "dur": 4.416, "args": { "External id": 18092,"Sequence number": 246696, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 683 } }, { "ph": "f", "id": 72, "pid": 1336754, "tid": 1381179, "ts": 1295650782172.848, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782173.450, "dur": 3.599, "args": { "External id": 18093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782174.108, "dur": 2.420, "args": { "External id": 18094,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782175.910, "dur": 0.506, "args": { "External id": 18095,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782184.117, "dur": 7.705, "args": { "External id": 18096,"Record function id": 0, "Ev Idx": 687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782185.778, "dur": 5.505, "args": { "External id": 18097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782187.000, "dur": 4.000, "args": { "External id": 18098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782189.205, "dur": 1.680, "args": { "External id": 18099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782195.223, "dur": 5.676, "args": { "External id": 18100,"Record function id": 0, "Sequence number": 246695, "Fwd thread id": 1, "Ev Idx": 691 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782196.712, "dur": 2.864, "args": { "External id": 18101,"Sequence number": 246695, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 692 } }, { "ph": "f", "id": 73, "pid": 1336754, "tid": 1381179, "ts": 1295650782196.712, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782197.953, "dur": 1.484, "args": { "External id": 18102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782198.660, "dur": 0.635, "args": { "External id": 18103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782203.853, "dur": 137.987, "args": { "External id": 18104,"Record function id": 0, "Sequence number": 246694, "Fwd thread id": 1, "Ev Idx": 695 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782204.597, "dur": 127.758, "args": { "External id": 18105,"Sequence number": 246694, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 696 } }, { "ph": "f", "id": 74, "pid": 1336754, "tid": 1381179, "ts": 1295650782204.597, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782206.749, "dur": 8.958, "args": { "External id": 18106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782209.578, "dur": 5.676, "args": { "External id": 18107,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782214.714, "dur": 0.418, "args": { "External id": 18108,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782216.264, "dur": 52.812, "args": { "External id": 18109,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782271.209, "dur": 5.280, "args": { "External id": 18110,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782272.078, "dur": 3.586, "args": { "External id": 18111,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782274.011, "dur": 1.518, "args": { "External id": 18112,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782279.336, "dur": 5.363, "args": { "External id": 18113,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782280.042, "dur": 4.123, "args": { "External id": 18114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782281.642, "dur": 2.447, "args": { "External id": 18115,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782285.373, "dur": 46.280, "args": { "External id": 18116,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782347.366, "dur": 32.945, "args": { "External id": 18117,"Record function id": 0, "Sequence number": 246693, "Fwd thread id": 1, "Ev Idx": 708 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782348.504, "dur": 4.706, "args": { "External id": 18118,"Sequence number": 246693, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 709 } }, { "ph": "f", "id": 75, "pid": 1336754, "tid": 1381179, "ts": 1295650782348.504, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782350.251, "dur": 2.805, "args": { "External id": 18119,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782351.676, "dur": 1.261, "args": { "External id": 18120,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650782356.129, "dur": 21.629, "args": { "External id": 18121,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 712 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782384.070, "dur": 9.546, "args": { "External id": 18122,"Record function id": 0, "Sequence number": 246692, "Fwd thread id": 1, "Ev Idx": 713 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782387.080, "dur": 4.831, "args": { "External id": 18123,"Sequence number": 246692, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 714 } }, { "ph": "f", "id": 76, "pid": 1336754, "tid": 1381179, "ts": 1295650782387.080, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782387.765, "dur": 3.911, "args": { "External id": 18124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782388.524, "dur": 2.631, "args": { "External id": 18125,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782390.489, "dur": 0.553, "args": { "External id": 18126,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782397.966, "dur": 5.534, "args": { "External id": 18127,"Record function id": 0, "Ev Idx": 718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782399.597, "dur": 3.376, "args": { "External id": 18128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782400.695, "dur": 1.949, "args": { "External id": 18129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782401.240, "dur": 1.270, "args": { "External id": 18130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650782409.655, "dur": 404.852, "args": { "External id": 18131,"Record function id": 0, "Sequence number": 246691, "Fwd thread id": 1, "Ev Idx": 722 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650782411.300, "dur": 371.730, "args": { "External id": 18132,"Sequence number": 246691, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 723 } }, { "ph": "f", "id": 77, "pid": 1336754, "tid": 1381179, "ts": 1295650782411.300, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1381179, "ts": 1295650782435.393, "dur": 35.819, "args": { "External id": 18133,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650782437.077, "dur": 33.941, "args": { "External id": 18134,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650782440.200, "dur": 6.496, "args": { "External id": 18135,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650782443.069, "dur": 2.976, "args": { "External id": 18136,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650782447.919, "dur": 22.558, "args": { "External id": 18137,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782483.626, "dur": 2.364, "args": { "External id": 18138,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782484.764, "dur": 1.049, "args": { "External id": 18139,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782489.572, "dur": 4.100, "args": { "External id": 18140,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782490.777, "dur": 2.804, "args": { "External id": 18141,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650782507.613, "dur": 1.962, "args": { "External id": 18142,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650782520.731, "dur": 2.021, "args": { "External id": 18143,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782675.733, "dur": 2.028, "args": { "External id": 18144,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650782681.778, "dur": 32.900, "args": { "External id": 18145,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782690.578, "dur": 0.699, "args": { "External id": 18146,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650782719.893, "dur": 30.428, "args": { "External id": 18147,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650782721.721, "dur": 28.337, "args": { "External id": 18148,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782725.893, "dur": 4.004, "args": { "External id": 18149,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650782733.090, "dur": 16.499, "args": { "External id": 18150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650782754.626, "dur": 2.526, "args": { "External id": 18151,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782755.824, "dur": 1.209, "args": { "External id": 18152,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782762.907, "dur": 2.714, "args": { "External id": 18153,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782764.386, "dur": 1.130, "args": { "External id": 18154,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782768.068, "dur": 4.185, "args": { "External id": 18155,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782769.418, "dur": 2.743, "args": { "External id": 18156,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650782795.926, "dur": 16.937, "args": { "External id": 18157,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782824.099, "dur": 7.630, "args": { "External id": 18158,"Record function id": 0, "Ev Idx": 749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650782826.076, "dur": 4.927, "args": { "External id": 18159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782827.543, "dur": 2.455, "args": { "External id": 18160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650782828.430, "dur": 1.483, "args": { "External id": 18161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782835.352, "dur": 8.129, "args": { "External id": 18162,"Record function id": 0, "Sequence number": 246690, "Fwd thread id": 1, "Ev Idx": 753 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782836.884, "dur": 4.186, "args": { "External id": 18163,"Sequence number": 246690, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 754 } }, { "ph": "f", "id": 78, "pid": 1336754, "tid": 1381179, "ts": 1295650782836.884, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782838.633, "dur": 2.265, "args": { "External id": 18164,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782839.688, "dur": 1.090, "args": { "External id": 18165,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782848.852, "dur": 118.043, "args": { "External id": 18166,"Record function id": 0, "Sequence number": 246689, "Fwd thread id": 1, "Ev Idx": 757 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782849.750, "dur": 111.546, "args": { "External id": 18167,"Sequence number": 246689, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 758 } }, { "ph": "f", "id": 79, "pid": 1336754, "tid": 1381179, "ts": 1295650782849.750, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782852.380, "dur": 4.929, "args": { "External id": 18168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782853.860, "dur": 2.893, "args": { "External id": 18169,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782855.787, "dur": 0.823, "args": { "External id": 18170,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782858.028, "dur": 49.967, "args": { "External id": 18171,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782909.240, "dur": 7.179, "args": { "External id": 18172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782911.965, "dur": 3.828, "args": { "External id": 18173,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782913.616, "dur": 2.008, "args": { "External id": 18174,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650782917.799, "dur": 3.670, "args": { "External id": 18175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650782918.698, "dur": 2.315, "args": { "External id": 18176,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650782920.184, "dur": 0.707, "args": { "External id": 18177,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650782922.052, "dur": 38.344, "args": { "External id": 18178,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 769 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782971.169, "dur": 10.843, "args": { "External id": 18179,"Record function id": 0, "Sequence number": 246688, "Fwd thread id": 1, "Ev Idx": 770 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650782974.415, "dur": 5.749, "args": { "External id": 18180,"Sequence number": 246688, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 771 } }, { "ph": "f", "id": 80, "pid": 1336754, "tid": 1381179, "ts": 1295650782974.415, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650782976.298, "dur": 3.715, "args": { "External id": 18181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650782977.309, "dur": 2.607, "args": { "External id": 18182,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 773 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783024.935, "dur": 10.938, "args": { "External id": 18183,"Record function id": 0, "Sequence number": 246687, "Fwd thread id": 1, "Ev Idx": 774 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783026.706, "dur": 6.622, "args": { "External id": 18184,"Sequence number": 246687, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 775 } }, { "ph": "f", "id": 81, "pid": 1336754, "tid": 1381179, "ts": 1295650783026.706, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650783027.720, "dur": 5.392, "args": { "External id": 18185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650783028.860, "dur": 3.446, "args": { "External id": 18186,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783031.061, "dur": 0.947, "args": { "External id": 18187,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 778 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650783041.119, "dur": 8.140, "args": { "External id": 18188,"Record function id": 0, "Ev Idx": 779 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650783043.204, "dur": 5.505, "args": { "External id": 18189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650783044.586, "dur": 3.857, "args": { "External id": 18190,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 781 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650783046.925, "dur": 1.425, "args": { "External id": 18191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 782 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783052.390, "dur": 6.047, "args": { "External id": 18192,"Record function id": 0, "Sequence number": 246686, "Fwd thread id": 1, "Ev Idx": 783 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783053.108, "dur": 3.740, "args": { "External id": 18193,"Sequence number": 246686, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 784 } }, { "ph": "f", "id": 82, "pid": 1336754, "tid": 1381179, "ts": 1295650783053.108, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783054.379, "dur": 2.321, "args": { "External id": 18194,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783055.340, "dur": 1.266, "args": { "External id": 18195,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 786 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783062.872, "dur": 301.287, "args": { "External id": 18196,"Record function id": 0, "Sequence number": 246685, "Fwd thread id": 1, "Ev Idx": 787 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783064.638, "dur": 283.115, "args": { "External id": 18197,"Sequence number": 246685, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 788 } }, { "ph": "f", "id": 83, "pid": 1336754, "tid": 1381179, "ts": 1295650783064.638, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650783079.430, "dur": 7.185, "args": { "External id": 18198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783082.395, "dur": 3.792, "args": { "External id": 18199,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650783088.840, "dur": 3.659, "args": { "External id": 18200,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783090.525, "dur": 1.756, "args": { "External id": 18201,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650783093.936, "dur": 5.094, "args": { "External id": 18202,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783095.813, "dur": 3.010, "args": { "External id": 18203,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 794 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650783122.401, "dur": 198.314, "args": { "External id": 18204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650783201.018, "dur": 3.493, "args": { "External id": 18205,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650783206.484, "dur": 4.032, "args": { "External id": 18206,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650783334.021, "dur": 4.120, "args": { "External id": 18207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650783341.202, "dur": 0.830, "args": { "External id": 18208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650783343.884, "dur": 0.825, "args": { "External id": 18209,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 800 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783373.341, "dur": 218.836, "args": { "External id": 18210,"Record function id": 0, "Sequence number": 246684, "Fwd thread id": 1, "Ev Idx": 801 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783375.167, "dur": 210.281, "args": { "External id": 18211,"Sequence number": 246684, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 802 } }, { "ph": "f", "id": 84, "pid": 1336754, "tid": 1381179, "ts": 1295650783375.167, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650783394.708, "dur": 46.678, "args": { "External id": 18212,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783397.801, "dur": 3.467, "args": { "External id": 18213,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650783402.626, "dur": 38.155, "args": { "External id": 18214,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650783450.895, "dur": 4.114, "args": { "External id": 18215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783452.703, "dur": 1.955, "args": { "External id": 18216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783599.268, "dur": 143.076, "args": { "External id": 18217,"Record function id": 0, "Sequence number": 246683, "Fwd thread id": 1, "Ev Idx": 808 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650783601.099, "dur": 136.328, "args": { "External id": 18218,"Sequence number": 246683, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 809 } }, { "ph": "f", "id": 85, "pid": 1336754, "tid": 1381179, "ts": 1295650783601.099, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650783612.855, "dur": 31.356, "args": { "External id": 18219,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783615.433, "dur": 2.340, "args": { "External id": 18220,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650783618.631, "dur": 25.088, "args": { "External id": 18221,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650783651.634, "dur": 4.337, "args": { "External id": 18222,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783653.480, "dur": 2.168, "args": { "External id": 18223,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 814 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783747.812, "dur": 14.195, "args": { "External id": 18224,"Record function id": 0, "Sequence number": 246682, "Fwd thread id": 1, "Ev Idx": 815 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783750.951, "dur": 8.819, "args": { "External id": 18225,"Sequence number": 246682, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 816 } }, { "ph": "f", "id": 86, "pid": 1336754, "tid": 1381179, "ts": 1295650783750.951, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783753.479, "dur": 5.957, "args": { "External id": 18226,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783754.867, "dur": 4.320, "args": { "External id": 18227,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 818 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783765.542, "dur": 6.121, "args": { "External id": 18228,"Record function id": 0, "Sequence number": 246681, "Fwd thread id": 1, "Ev Idx": 819 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783766.506, "dur": 3.404, "args": { "External id": 18229,"Sequence number": 246681, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 820 } }, { "ph": "f", "id": 87, "pid": 1336754, "tid": 1381179, "ts": 1295650783766.506, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783767.850, "dur": 1.915, "args": { "External id": 18230,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783768.858, "dur": 0.763, "args": { "External id": 18231,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 822 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783777.111, "dur": 7.862, "args": { "External id": 18232,"Record function id": 0, "Sequence number": 246680, "Fwd thread id": 1, "Ev Idx": 823 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783777.898, "dur": 4.777, "args": { "External id": 18233,"Sequence number": 246680, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 824 } }, { "ph": "f", "id": 88, "pid": 1336754, "tid": 1381179, "ts": 1295650783777.898, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783778.963, "dur": 3.560, "args": { "External id": 18234,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783781.862, "dur": 0.545, "args": { "External id": 18235,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 826 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783788.566, "dur": 5.763, "args": { "External id": 18236,"Record function id": 0, "Sequence number": 246679, "Fwd thread id": 1, "Ev Idx": 827 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783789.728, "dur": 2.812, "args": { "External id": 18237,"Sequence number": 246679, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 828 } }, { "ph": "f", "id": 89, "pid": 1336754, "tid": 1381179, "ts": 1295650783789.728, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783790.831, "dur": 1.571, "args": { "External id": 18238,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783791.583, "dur": 0.694, "args": { "External id": 18239,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 830 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783797.817, "dur": 141.685, "args": { "External id": 18240,"Record function id": 0, "Sequence number": 246678, "Fwd thread id": 1, "Ev Idx": 831 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783798.754, "dur": 133.368, "args": { "External id": 18241,"Sequence number": 246678, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 832 } }, { "ph": "f", "id": 90, "pid": 1336754, "tid": 1381179, "ts": 1295650783798.754, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650783801.881, "dur": 7.142, "args": { "External id": 18242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650783803.243, "dur": 5.205, "args": { "External id": 18243,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783806.822, "dur": 1.411, "args": { "External id": 18244,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650783810.662, "dur": 65.736, "args": { "External id": 18245,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650783877.931, "dur": 4.458, "args": { "External id": 18246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650783878.572, "dur": 3.214, "args": { "External id": 18247,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783880.364, "dur": 1.229, "args": { "External id": 18248,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650783883.666, "dur": 5.383, "args": { "External id": 18249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650783884.585, "dur": 4.006, "args": { "External id": 18250,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783887.997, "dur": 0.495, "args": { "External id": 18251,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650783889.532, "dur": 41.683, "args": { "External id": 18252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783944.068, "dur": 6.106, "args": { "External id": 18253,"Record function id": 0, "Sequence number": 246677, "Fwd thread id": 1, "Ev Idx": 844 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783944.914, "dur": 3.887, "args": { "External id": 18254,"Sequence number": 246677, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 845 } }, { "ph": "f", "id": 91, "pid": 1336754, "tid": 1381179, "ts": 1295650783944.914, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650783946.458, "dur": 2.214, "args": { "External id": 18255,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650783947.454, "dur": 1.100, "args": { "External id": 18256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783953.288, "dur": 10.274, "args": { "External id": 18257,"Record function id": 0, "Sequence number": 246676, "Fwd thread id": 1, "Ev Idx": 848 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783954.208, "dur": 6.973, "args": { "External id": 18258,"Sequence number": 246676, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 849 } }, { "ph": "f", "id": 92, "pid": 1336754, "tid": 1381179, "ts": 1295650783954.208, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650783954.833, "dur": 6.155, "args": { "External id": 18259,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650783958.030, "dur": 2.442, "args": { "External id": 18260,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650783959.906, "dur": 0.467, "args": { "External id": 18261,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 852 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650783969.313, "dur": 9.126, "args": { "External id": 18262,"Record function id": 0, "Ev Idx": 853 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650783971.266, "dur": 6.362, "args": { "External id": 18263,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650783973.620, "dur": 3.604, "args": { "External id": 18264,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 855 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650783974.727, "dur": 2.385, "args": { "External id": 18265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783982.133, "dur": 46.757, "args": { "External id": 18266,"Record function id": 0, "Sequence number": 246675, "Fwd thread id": 1, "Ev Idx": 857 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650783983.492, "dur": 42.371, "args": { "External id": 18267,"Sequence number": 246675, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 858 } }, { "ph": "f", "id": 93, "pid": 1336754, "tid": 1381179, "ts": 1295650783983.492, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784022.304, "dur": 3.386, "args": { "External id": 18268,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784023.724, "dur": 1.730, "args": { "External id": 18269,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 860 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784035.626, "dur": 96.265, "args": { "External id": 18270,"Record function id": 0, "Sequence number": 246674, "Fwd thread id": 1, "Ev Idx": 861 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784036.556, "dur": 89.429, "args": { "External id": 18271,"Sequence number": 246674, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 862 } }, { "ph": "f", "id": 94, "pid": 1336754, "tid": 1381179, "ts": 1295650784036.556, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784038.516, "dur": 3.331, "args": { "External id": 18272,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784039.257, "dur": 2.142, "args": { "External id": 18273,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784040.630, "dur": 0.668, "args": { "External id": 18274,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650784042.465, "dur": 34.702, "args": { "External id": 18275,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784078.355, "dur": 6.513, "args": { "External id": 18276,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784081.047, "dur": 3.173, "args": { "External id": 18277,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784082.716, "dur": 1.371, "args": { "External id": 18278,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784086.080, "dur": 4.886, "args": { "External id": 18279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784086.893, "dur": 3.499, "args": { "External id": 18280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784088.180, "dur": 2.123, "args": { "External id": 18281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650784091.362, "dur": 33.857, "args": { "External id": 18282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 873 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784135.939, "dur": 34.384, "args": { "External id": 18283,"Record function id": 0, "Sequence number": 246673, "Fwd thread id": 1, "Ev Idx": 874 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784139.128, "dur": 3.586, "args": { "External id": 18284,"Sequence number": 246673, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 875 } }, { "ph": "f", "id": 95, "pid": 1336754, "tid": 1381179, "ts": 1295650784139.128, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784140.731, "dur": 1.835, "args": { "External id": 18285,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784141.572, "dur": 0.867, "args": { "External id": 18286,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650784145.696, "dur": 22.924, "args": { "External id": 18287,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784173.851, "dur": 8.769, "args": { "External id": 18288,"Record function id": 0, "Sequence number": 246672, "Fwd thread id": 1, "Ev Idx": 879 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784174.762, "dur": 5.985, "args": { "External id": 18289,"Sequence number": 246672, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 880 } }, { "ph": "f", "id": 96, "pid": 1336754, "tid": 1381179, "ts": 1295650784174.762, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784175.409, "dur": 5.106, "args": { "External id": 18290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784176.118, "dur": 3.884, "args": { "External id": 18291,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784179.359, "dur": 0.536, "args": { "External id": 18292,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 883 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784187.085, "dur": 6.648, "args": { "External id": 18293,"Record function id": 0, "Ev Idx": 884 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784189.042, "dur": 4.110, "args": { "External id": 18294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784190.427, "dur": 2.388, "args": { "External id": 18295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 886 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784191.307, "dur": 1.439, "args": { "External id": 18296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 887 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784197.311, "dur": 6.829, "args": { "External id": 18297,"Record function id": 0, "Sequence number": 246671, "Fwd thread id": 1, "Ev Idx": 888 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784199.052, "dur": 3.080, "args": { "External id": 18298,"Sequence number": 246671, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 889 } }, { "ph": "f", "id": 97, "pid": 1336754, "tid": 1381179, "ts": 1295650784199.052, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784200.163, "dur": 1.832, "args": { "External id": 18299,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784200.951, "dur": 0.929, "args": { "External id": 18300,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 891 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784209.529, "dur": 116.847, "args": { "External id": 18301,"Record function id": 0, "Sequence number": 246670, "Fwd thread id": 1, "Ev Idx": 892 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784212.442, "dur": 105.834, "args": { "External id": 18302,"Sequence number": 246670, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 893 } }, { "ph": "f", "id": 98, "pid": 1336754, "tid": 1381179, "ts": 1295650784212.442, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784214.273, "dur": 3.751, "args": { "External id": 18303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784215.035, "dur": 2.496, "args": { "External id": 18304,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784216.793, "dur": 0.636, "args": { "External id": 18305,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650784218.563, "dur": 45.962, "args": { "External id": 18306,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784266.574, "dur": 6.329, "args": { "External id": 18307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784267.317, "dur": 4.958, "args": { "External id": 18308,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784271.296, "dur": 0.868, "args": { "External id": 18309,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784274.170, "dur": 6.626, "args": { "External id": 18310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784278.536, "dur": 1.827, "args": { "External id": 18311,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784279.980, "dur": 0.304, "args": { "External id": 18312,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650784281.525, "dur": 35.995, "args": { "External id": 18313,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 904 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784332.128, "dur": 28.575, "args": { "External id": 18314,"Record function id": 0, "Sequence number": 246669, "Fwd thread id": 1, "Ev Idx": 905 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784333.142, "dur": 6.441, "args": { "External id": 18315,"Sequence number": 246669, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 906 } }, { "ph": "f", "id": 99, "pid": 1336754, "tid": 1381179, "ts": 1295650784333.142, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784336.901, "dur": 2.552, "args": { "External id": 18316,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784338.077, "dur": 1.282, "args": { "External id": 18317,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650784342.140, "dur": 16.478, "args": { "External id": 18318,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784364.247, "dur": 7.046, "args": { "External id": 18319,"Record function id": 0, "Sequence number": 246668, "Fwd thread id": 1, "Ev Idx": 910 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784365.128, "dur": 4.573, "args": { "External id": 18320,"Sequence number": 246668, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 911 } }, { "ph": "f", "id": 100, "pid": 1336754, "tid": 1381179, "ts": 1295650784365.128, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784365.937, "dur": 3.514, "args": { "External id": 18321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784366.623, "dur": 2.314, "args": { "External id": 18322,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784368.401, "dur": 0.390, "args": { "External id": 18323,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 914 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784375.454, "dur": 7.897, "args": { "External id": 18324,"Record function id": 0, "Ev Idx": 915 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784377.255, "dur": 5.597, "args": { "External id": 18325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784378.443, "dur": 4.007, "args": { "External id": 18326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 917 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784381.233, "dur": 1.143, "args": { "External id": 18327,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 918 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650784387.996, "dur": 345.598, "args": { "External id": 18328,"Record function id": 0, "Sequence number": 246667, "Fwd thread id": 1, "Ev Idx": 919 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650784389.537, "dur": 314.916, "args": { "External id": 18329,"Sequence number": 246667, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 920 } }, { "ph": "f", "id": 101, "pid": 1336754, "tid": 1381179, "ts": 1295650784389.537, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784422.874, "dur": 1.987, "args": { "External id": 18330,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784423.701, "dur": 1.041, "args": { "External id": 18331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650784439.073, "dur": 4.735, "args": { "External id": 18332,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650784455.346, "dur": 1.920, "args": { "External id": 18333,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784597.195, "dur": 1.772, "args": { "External id": 18334,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650784602.814, "dur": 35.369, "args": { "External id": 18335,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784612.989, "dur": 0.703, "args": { "External id": 18336,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650784647.446, "dur": 33.115, "args": { "External id": 18337,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650784649.144, "dur": 31.168, "args": { "External id": 18338,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784653.290, "dur": 5.044, "args": { "External id": 18339,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650784659.894, "dur": 19.839, "args": { "External id": 18340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650784687.046, "dur": 2.257, "args": { "External id": 18341,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784688.134, "dur": 1.069, "args": { "External id": 18342,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784695.335, "dur": 2.058, "args": { "External id": 18343,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784696.344, "dur": 0.936, "args": { "External id": 18344,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650784713.244, "dur": 16.829, "args": { "External id": 18345,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 936 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784744.278, "dur": 10.689, "args": { "External id": 18346,"Record function id": 0, "Ev Idx": 937 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650784746.638, "dur": 7.600, "args": { "External id": 18347,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784748.200, "dur": 4.921, "args": { "External id": 18348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 939 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650784751.333, "dur": 1.629, "args": { "External id": 18349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784758.635, "dur": 4.964, "args": { "External id": 18350,"Record function id": 0, "Sequence number": 246666, "Fwd thread id": 1, "Ev Idx": 941 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650784759.786, "dur": 0.927, "args": { "External id": 18351,"Sequence number": 246666, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 942 } }, { "ph": "f", "id": 102, "pid": 1336754, "tid": 1381179, "ts": 1295650784759.786, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650784767.793, "dur": 496.216, "args": { "External id": 18352,"Record function id": 0, "Sequence number": 246665, "Fwd thread id": 1, "Ev Idx": 943 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650784769.398, "dur": 481.002, "args": { "External id": 18353,"Sequence number": 246665, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 944 } }, { "ph": "f", "id": 103, "pid": 1336754, "tid": 1381179, "ts": 1295650784769.398, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650784797.640, "dur": 7.933, "args": { "External id": 18354,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650784802.574, "dur": 2.751, "args": { "External id": 18355,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784808.543, "dur": 6.843, "args": { "External id": 18356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784812.259, "dur": 2.552, "args": { "External id": 18357,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784813.892, "dur": 0.744, "args": { "External id": 18358,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1381179, "ts": 1295650784818.834, "dur": 99.272, "args": { "External id": 18359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650784819.642, "dur": 4.220, "args": { "External id": 18360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650784820.246, "dur": 3.086, "args": { "External id": 18361,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650784821.848, "dur": 1.380, "args": { "External id": 18362,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1381179, "ts": 1295650784827.291, "dur": 90.438, "args": { "External id": 18363,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650784828.515, "dur": 88.419, "args": { "External id": 18364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650784921.827, "dur": 2.869, "args": { "External id": 18365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650784923.167, "dur": 1.385, "args": { "External id": 18366,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650784955.298, "dur": 4.257, "args": { "External id": 18367,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650784961.047, "dur": 1.804, "args": { "External id": 18368,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650784963.664, "dur": 1.391, "args": { "External id": 18369,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785042.026, "dur": 3.440, "args": { "External id": 18370,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785043.033, "dur": 2.194, "args": { "External id": 18371,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336754, "tid": 1381179, "ts": 1295650785065.662, "dur": 148.650, "args": { "External id": 18372,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650785070.642, "dur": 5.998, "args": { "External id": 18373,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785074.691, "dur": 1.106, "args": { "External id": 18374,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650785078.682, "dur": 7.478, "args": { "External id": 18375,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785083.144, "dur": 2.410, "args": { "External id": 18376,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650785087.706, "dur": 3.119, "args": { "External id": 18377,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785090.080, "dur": 0.436, "args": { "External id": 18378,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650785091.847, "dur": 3.890, "args": { "External id": 18379,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785094.720, "dur": 0.556, "args": { "External id": 18380,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650785101.653, "dur": 2.869, "args": { "External id": 18381,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785103.706, "dur": 0.479, "args": { "External id": 18382,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785105.703, "dur": 6.301, "args": { "External id": 18383,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650785110.192, "dur": 1.634, "args": { "External id": 18384,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650785113.119, "dur": 2.625, "args": { "External id": 18385,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785115.044, "dur": 0.430, "args": { "External id": 18386,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785116.747, "dur": 4.170, "args": { "External id": 18387,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785117.676, "dur": 3.152, "args": { "External id": 18388,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650785122.580, "dur": 77.004, "args": { "External id": 18389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785203.457, "dur": 2.721, "args": { "External id": 18390,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650785207.229, "dur": 2.577, "args": { "External id": 18391,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785208.883, "dur": 0.425, "args": { "External id": 18392,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785212.221, "dur": 0.869, "args": { "External id": 18393,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785277.432, "dur": 10.837, "args": { "External id": 18394,"Record function id": 0, "Ev Idx": 985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785280.159, "dur": 7.318, "args": { "External id": 18395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785282.686, "dur": 3.942, "args": { "External id": 18396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785284.139, "dur": 2.390, "args": { "External id": 18397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785292.283, "dur": 7.984, "args": { "External id": 18398,"Record function id": 0, "Sequence number": 246664, "Fwd thread id": 1, "Ev Idx": 989 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785293.701, "dur": 4.422, "args": { "External id": 18399,"Sequence number": 246664, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 990 } }, { "ph": "f", "id": 104, "pid": 1336754, "tid": 1381179, "ts": 1295650785293.701, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785295.376, "dur": 2.549, "args": { "External id": 18400,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785296.558, "dur": 1.249, "args": { "External id": 18401,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785306.391, "dur": 181.130, "args": { "External id": 18402,"Record function id": 0, "Sequence number": 246663, "Fwd thread id": 1, "Ev Idx": 993 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785307.181, "dur": 174.208, "args": { "External id": 18403,"Sequence number": 246663, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 994 } }, { "ph": "f", "id": 105, "pid": 1336754, "tid": 1381179, "ts": 1295650785307.181, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785309.913, "dur": 4.991, "args": { "External id": 18404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785311.520, "dur": 2.786, "args": { "External id": 18405,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785313.554, "dur": 0.604, "args": { "External id": 18406,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650785315.796, "dur": 64.764, "args": { "External id": 18407,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785381.798, "dur": 6.357, "args": { "External id": 18408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785382.546, "dur": 4.860, "args": { "External id": 18409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785386.139, "dur": 1.094, "args": { "External id": 18410,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785389.504, "dur": 4.000, "args": { "External id": 18411,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785390.714, "dur": 2.324, "args": { "External id": 18412,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785392.586, "dur": 0.380, "args": { "External id": 18413,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650785394.226, "dur": 86.453, "args": { "External id": 18414,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785491.977, "dur": 9.403, "args": { "External id": 18415,"Record function id": 0, "Sequence number": 246662, "Fwd thread id": 1, "Ev Idx": 1006 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785492.971, "dur": 7.221, "args": { "External id": 18416,"Sequence number": 246662, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1007 } }, { "ph": "f", "id": 106, "pid": 1336754, "tid": 1381179, "ts": 1295650785492.971, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785494.583, "dur": 5.452, "args": { "External id": 18417,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785498.759, "dur": 1.178, "args": { "External id": 18418,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1009 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785504.731, "dur": 7.242, "args": { "External id": 18419,"Record function id": 0, "Sequence number": 246661, "Fwd thread id": 1, "Ev Idx": 1010 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785505.690, "dur": 4.475, "args": { "External id": 18420,"Sequence number": 246661, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1011 } }, { "ph": "f", "id": 107, "pid": 1336754, "tid": 1381179, "ts": 1295650785505.690, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785506.450, "dur": 3.495, "args": { "External id": 18421,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785507.125, "dur": 2.308, "args": { "External id": 18422,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785508.710, "dur": 0.581, "args": { "External id": 18423,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1014 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785515.933, "dur": 5.486, "args": { "External id": 18424,"Record function id": 0, "Ev Idx": 1015 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785517.708, "dur": 3.218, "args": { "External id": 18425,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785518.872, "dur": 1.793, "args": { "External id": 18426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1017 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785519.403, "dur": 1.189, "args": { "External id": 18427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1018 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785526.767, "dur": 8.364, "args": { "External id": 18428,"Record function id": 0, "Sequence number": 246660, "Fwd thread id": 1, "Ev Idx": 1019 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785528.152, "dur": 5.302, "args": { "External id": 18429,"Sequence number": 246660, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1020 } }, { "ph": "f", "id": 108, "pid": 1336754, "tid": 1381179, "ts": 1295650785528.152, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785531.432, "dur": 1.885, "args": { "External id": 18430,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785532.414, "dur": 0.789, "args": { "External id": 18431,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1022 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785538.118, "dur": 173.222, "args": { "External id": 18432,"Record function id": 0, "Sequence number": 246659, "Fwd thread id": 1, "Ev Idx": 1023 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785564.154, "dur": 140.508, "args": { "External id": 18433,"Sequence number": 246659, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1024 } }, { "ph": "f", "id": 109, "pid": 1336754, "tid": 1381179, "ts": 1295650785564.154, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785566.060, "dur": 4.273, "args": { "External id": 18434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785566.496, "dur": 3.405, "args": { "External id": 18435,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785569.416, "dur": 0.338, "args": { "External id": 18436,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650785570.816, "dur": 50.095, "args": { "External id": 18437,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785621.962, "dur": 4.543, "args": { "External id": 18438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785622.392, "dur": 3.581, "args": { "External id": 18439,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785624.266, "dur": 1.520, "args": { "External id": 18440,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785627.521, "dur": 7.029, "args": { "External id": 18441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785628.524, "dur": 5.556, "args": { "External id": 18442,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785632.154, "dur": 1.833, "args": { "External id": 18443,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650785635.143, "dur": 68.853, "args": { "External id": 18444,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785715.935, "dur": 35.744, "args": { "External id": 18445,"Record function id": 0, "Sequence number": 246658, "Fwd thread id": 1, "Ev Idx": 1036 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785716.820, "dur": 3.688, "args": { "External id": 18446,"Sequence number": 246658, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1037 } }, { "ph": "f", "id": 110, "pid": 1336754, "tid": 1381179, "ts": 1295650785716.820, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785718.404, "dur": 1.951, "args": { "External id": 18447,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785719.298, "dur": 0.940, "args": { "External id": 18448,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650785723.597, "dur": 25.444, "args": { "External id": 18449,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1040 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785755.281, "dur": 8.754, "args": { "External id": 18450,"Record function id": 0, "Sequence number": 246657, "Fwd thread id": 1, "Ev Idx": 1041 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650785756.028, "dur": 6.186, "args": { "External id": 18451,"Sequence number": 246657, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1042 } }, { "ph": "f", "id": 111, "pid": 1336754, "tid": 1381179, "ts": 1295650785756.028, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650785758.717, "dur": 3.309, "args": { "External id": 18452,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650785759.294, "dur": 2.151, "args": { "External id": 18453,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650785760.713, "dur": 0.619, "args": { "External id": 18454,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1045 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785768.193, "dur": 4.652, "args": { "External id": 18455,"Record function id": 0, "Ev Idx": 1046 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650785769.936, "dur": 2.428, "args": { "External id": 18456,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785770.771, "dur": 1.291, "args": { "External id": 18457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1048 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650785771.201, "dur": 0.760, "args": { "External id": 18458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1049 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650785776.769, "dur": 443.159, "args": { "External id": 18459,"Record function id": 0, "Sequence number": 246656, "Fwd thread id": 1, "Ev Idx": 1050 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650785778.677, "dur": 407.842, "args": { "External id": 18460,"Sequence number": 246656, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1051 } }, { "ph": "f", "id": 112, "pid": 1336754, "tid": 1381179, "ts": 1295650785778.677, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1381179, "ts": 1295650785801.848, "dur": 34.339, "args": { "External id": 18461,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650785803.140, "dur": 32.835, "args": { "External id": 18462,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650785806.113, "dur": 5.553, "args": { "External id": 18463,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650785808.650, "dur": 2.551, "args": { "External id": 18464,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650785812.902, "dur": 22.530, "args": { "External id": 18465,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785848.049, "dur": 2.183, "args": { "External id": 18466,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785848.820, "dur": 1.272, "args": { "External id": 18467,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650785854.032, "dur": 2.626, "args": { "External id": 18468,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650785854.987, "dur": 1.578, "args": { "External id": 18469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650785870.754, "dur": 2.055, "args": { "External id": 18470,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650785882.947, "dur": 1.818, "args": { "External id": 18471,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786073.478, "dur": 3.706, "args": { "External id": 18472,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650786081.401, "dur": 35.475, "args": { "External id": 18473,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786091.533, "dur": 0.937, "args": { "External id": 18474,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650786122.412, "dur": 31.098, "args": { "External id": 18475,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650786124.262, "dur": 29.055, "args": { "External id": 18476,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786129.081, "dur": 3.717, "args": { "External id": 18477,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650786136.226, "dur": 16.635, "args": { "External id": 18478,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650786157.476, "dur": 2.214, "args": { "External id": 18479,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786158.535, "dur": 1.046, "args": { "External id": 18480,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650786166.272, "dur": 2.201, "args": { "External id": 18481,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786167.260, "dur": 1.102, "args": { "External id": 18482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650786171.202, "dur": 3.656, "args": { "External id": 18483,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786172.405, "dur": 2.360, "args": { "External id": 18484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650786201.007, "dur": 17.569, "args": { "External id": 18485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1076 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650786248.256, "dur": 10.908, "args": { "External id": 18486,"Record function id": 0, "Ev Idx": 1077 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650786251.189, "dur": 6.972, "args": { "External id": 18487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650786253.502, "dur": 3.396, "args": { "External id": 18488,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1079 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650786254.691, "dur": 1.993, "args": { "External id": 18489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1080 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786263.997, "dur": 9.241, "args": { "External id": 18490,"Record function id": 0, "Sequence number": 246655, "Fwd thread id": 1, "Ev Idx": 1081 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786265.661, "dur": 4.873, "args": { "External id": 18491,"Sequence number": 246655, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1082 } }, { "ph": "f", "id": 113, "pid": 1336754, "tid": 1381179, "ts": 1295650786265.661, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650786267.604, "dur": 2.766, "args": { "External id": 18492,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786268.583, "dur": 1.655, "args": { "External id": 18493,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1084 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786279.092, "dur": 133.359, "args": { "External id": 18494,"Record function id": 0, "Sequence number": 246654, "Fwd thread id": 1, "Ev Idx": 1085 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786280.036, "dur": 125.409, "args": { "External id": 18495,"Sequence number": 246654, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1086 } }, { "ph": "f", "id": 114, "pid": 1336754, "tid": 1381179, "ts": 1295650786280.036, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650786283.156, "dur": 6.115, "args": { "External id": 18496,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650786284.742, "dur": 3.905, "args": { "External id": 18497,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786287.320, "dur": 1.108, "args": { "External id": 18498,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650786290.302, "dur": 59.272, "args": { "External id": 18499,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650786350.945, "dur": 6.897, "args": { "External id": 18500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650786353.948, "dur": 3.263, "args": { "External id": 18501,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786355.630, "dur": 1.405, "args": { "External id": 18502,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650786359.615, "dur": 3.806, "args": { "External id": 18503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650786360.620, "dur": 2.308, "args": { "External id": 18504,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786362.322, "dur": 0.530, "args": { "External id": 18505,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650786364.018, "dur": 40.698, "args": { "External id": 18506,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786417.151, "dur": 11.852, "args": { "External id": 18507,"Record function id": 0, "Sequence number": 246653, "Fwd thread id": 1, "Ev Idx": 1098 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786418.401, "dur": 8.360, "args": { "External id": 18508,"Sequence number": 246653, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1099 } }, { "ph": "f", "id": 115, "pid": 1336754, "tid": 1381179, "ts": 1295650786418.401, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650786422.521, "dur": 4.088, "args": { "External id": 18509,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786423.953, "dur": 2.510, "args": { "External id": 18510,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786432.786, "dur": 7.181, "args": { "External id": 18511,"Record function id": 0, "Sequence number": 246652, "Fwd thread id": 1, "Ev Idx": 1102 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786433.737, "dur": 4.581, "args": { "External id": 18512,"Sequence number": 246652, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1103 } }, { "ph": "f", "id": 116, "pid": 1336754, "tid": 1381179, "ts": 1295650786433.737, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650786434.407, "dur": 3.700, "args": { "External id": 18513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650786435.034, "dur": 2.553, "args": { "External id": 18514,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786437.020, "dur": 0.455, "args": { "External id": 18515,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1106 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650786443.735, "dur": 7.321, "args": { "External id": 18516,"Record function id": 0, "Ev Idx": 1107 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650786445.432, "dur": 5.126, "args": { "External id": 18517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650786446.427, "dur": 3.883, "args": { "External id": 18518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1109 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650786449.292, "dur": 0.914, "args": { "External id": 18519,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1110 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786456.248, "dur": 6.463, "args": { "External id": 18520,"Record function id": 0, "Sequence number": 246651, "Fwd thread id": 1, "Ev Idx": 1111 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650786457.018, "dur": 3.894, "args": { "External id": 18521,"Sequence number": 246651, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1112 } }, { "ph": "f", "id": 117, "pid": 1336754, "tid": 1381179, "ts": 1295650786457.018, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650786458.186, "dur": 2.592, "args": { "External id": 18522,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650786459.284, "dur": 1.368, "args": { "External id": 18523,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1114 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786466.993, "dur": 278.008, "args": { "External id": 18524,"Record function id": 0, "Sequence number": 246650, "Fwd thread id": 1, "Ev Idx": 1115 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786468.834, "dur": 261.146, "args": { "External id": 18525,"Sequence number": 246650, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1116 } }, { "ph": "f", "id": 118, "pid": 1336754, "tid": 1381179, "ts": 1295650786468.834, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650786483.328, "dur": 6.385, "args": { "External id": 18526,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786486.112, "dur": 3.146, "args": { "External id": 18527,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650786491.845, "dur": 4.357, "args": { "External id": 18528,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786493.271, "dur": 2.754, "args": { "External id": 18529,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650786506.916, "dur": 6.347, "args": { "External id": 18530,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786511.502, "dur": 1.581, "args": { "External id": 18531,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1122 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650786538.753, "dur": 167.103, "args": { "External id": 18532,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650786614.969, "dur": 4.678, "args": { "External id": 18533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650786621.291, "dur": 2.924, "args": { "External id": 18534,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650786717.789, "dur": 3.441, "args": { "External id": 18535,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650786724.524, "dur": 0.553, "args": { "External id": 18536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650786726.970, "dur": 0.521, "args": { "External id": 18537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1128 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786752.165, "dur": 212.554, "args": { "External id": 18538,"Record function id": 0, "Sequence number": 246649, "Fwd thread id": 1, "Ev Idx": 1129 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786754.335, "dur": 203.842, "args": { "External id": 18539,"Sequence number": 246649, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1130 } }, { "ph": "f", "id": 119, "pid": 1336754, "tid": 1381179, "ts": 1295650786754.335, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650786773.515, "dur": 44.084, "args": { "External id": 18540,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786776.713, "dur": 2.914, "args": { "External id": 18541,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650786781.066, "dur": 35.965, "args": { "External id": 18542,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650786827.113, "dur": 4.538, "args": { "External id": 18543,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650786828.998, "dur": 2.353, "args": { "External id": 18544,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1135 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786970.720, "dur": 216.365, "args": { "External id": 18545,"Record function id": 0, "Sequence number": 246648, "Fwd thread id": 1, "Ev Idx": 1136 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650786972.908, "dur": 207.177, "args": { "External id": 18546,"Sequence number": 246648, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1137 } }, { "ph": "f", "id": 120, "pid": 1336754, "tid": 1381179, "ts": 1295650786972.908, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650787023.135, "dur": 52.865, "args": { "External id": 18547,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787027.305, "dur": 4.149, "args": { "External id": 18548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650787037.200, "dur": 38.303, "args": { "External id": 18549,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650787084.853, "dur": 4.535, "args": { "External id": 18550,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787086.950, "dur": 2.095, "args": { "External id": 18551,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1142 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787196.686, "dur": 14.360, "args": { "External id": 18552,"Record function id": 0, "Sequence number": 246647, "Fwd thread id": 1, "Ev Idx": 1143 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787198.411, "dur": 10.233, "args": { "External id": 18553,"Sequence number": 246647, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1144 } }, { "ph": "f", "id": 121, "pid": 1336754, "tid": 1381179, "ts": 1295650787198.411, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787201.117, "dur": 7.220, "args": { "External id": 18554,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787202.427, "dur": 5.733, "args": { "External id": 18555,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1146 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787214.603, "dur": 6.050, "args": { "External id": 18556,"Record function id": 0, "Sequence number": 246646, "Fwd thread id": 1, "Ev Idx": 1147 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787215.426, "dur": 3.476, "args": { "External id": 18557,"Sequence number": 246646, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1148 } }, { "ph": "f", "id": 122, "pid": 1336754, "tid": 1381179, "ts": 1295650787215.426, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787216.910, "dur": 1.864, "args": { "External id": 18558,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787217.975, "dur": 0.661, "args": { "External id": 18559,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1150 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787223.854, "dur": 26.770, "args": { "External id": 18560,"Record function id": 0, "Sequence number": 246645, "Fwd thread id": 1, "Ev Idx": 1151 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787224.602, "dur": 22.885, "args": { "External id": 18561,"Sequence number": 246645, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1152 } }, { "ph": "f", "id": 123, "pid": 1336754, "tid": 1381179, "ts": 1295650787224.602, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787243.975, "dur": 3.311, "args": { "External id": 18562,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787245.528, "dur": 1.511, "args": { "External id": 18563,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787255.650, "dur": 6.362, "args": { "External id": 18564,"Record function id": 0, "Sequence number": 246644, "Fwd thread id": 1, "Ev Idx": 1155 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787256.891, "dur": 3.231, "args": { "External id": 18565,"Sequence number": 246644, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1156 } }, { "ph": "f", "id": 124, "pid": 1336754, "tid": 1381179, "ts": 1295650787256.891, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787258.155, "dur": 1.826, "args": { "External id": 18566,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787258.815, "dur": 1.064, "args": { "External id": 18567,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1158 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787265.261, "dur": 153.091, "args": { "External id": 18568,"Record function id": 0, "Sequence number": 246643, "Fwd thread id": 1, "Ev Idx": 1159 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787266.254, "dur": 144.002, "args": { "External id": 18569,"Sequence number": 246643, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1160 } }, { "ph": "f", "id": 125, "pid": 1336754, "tid": 1381179, "ts": 1295650787266.254, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787269.781, "dur": 9.251, "args": { "External id": 18570,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787273.624, "dur": 4.768, "args": { "External id": 18571,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787276.475, "dur": 1.658, "args": { "External id": 18572,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787280.389, "dur": 69.680, "args": { "External id": 18573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787351.533, "dur": 4.949, "args": { "External id": 18574,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787352.424, "dur": 3.386, "args": { "External id": 18575,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787354.616, "dur": 1.035, "args": { "External id": 18576,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787358.369, "dur": 6.911, "args": { "External id": 18577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787362.036, "dur": 2.546, "args": { "External id": 18578,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787364.027, "dur": 0.458, "args": { "External id": 18579,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787366.134, "dur": 43.413, "args": { "External id": 18580,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1171 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787425.500, "dur": 7.969, "args": { "External id": 18581,"Record function id": 0, "Sequence number": 246642, "Fwd thread id": 1, "Ev Idx": 1172 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787426.520, "dur": 4.971, "args": { "External id": 18582,"Sequence number": 246642, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1173 } }, { "ph": "f", "id": 126, "pid": 1336754, "tid": 1381179, "ts": 1295650787426.520, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787428.446, "dur": 2.892, "args": { "External id": 18583,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787429.900, "dur": 1.273, "args": { "External id": 18584,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1175 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787436.843, "dur": 9.981, "args": { "External id": 18585,"Record function id": 0, "Sequence number": 246641, "Fwd thread id": 1, "Ev Idx": 1176 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787437.909, "dur": 6.628, "args": { "External id": 18586,"Sequence number": 246641, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1177 } }, { "ph": "f", "id": 127, "pid": 1336754, "tid": 1381179, "ts": 1295650787437.909, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787440.354, "dur": 3.954, "args": { "External id": 18587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787441.264, "dur": 2.532, "args": { "External id": 18588,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787443.233, "dur": 0.451, "args": { "External id": 18589,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787452.914, "dur": 9.051, "args": { "External id": 18590,"Record function id": 0, "Ev Idx": 1181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787455.021, "dur": 6.171, "args": { "External id": 18591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787457.220, "dur": 3.585, "args": { "External id": 18592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787458.381, "dur": 2.322, "args": { "External id": 18593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787465.254, "dur": 8.210, "args": { "External id": 18594,"Record function id": 0, "Sequence number": 246640, "Fwd thread id": 1, "Ev Idx": 1185 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787466.820, "dur": 5.038, "args": { "External id": 18595,"Sequence number": 246640, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1186 } }, { "ph": "f", "id": 128, "pid": 1336754, "tid": 1381179, "ts": 1295650787466.820, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787467.847, "dur": 3.865, "args": { "External id": 18596,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787470.873, "dur": 0.737, "args": { "External id": 18597,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787476.540, "dur": 91.164, "args": { "External id": 18598,"Record function id": 0, "Sequence number": 246639, "Fwd thread id": 1, "Ev Idx": 1189 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787477.327, "dur": 84.936, "args": { "External id": 18599,"Sequence number": 246639, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1190 } }, { "ph": "f", "id": 129, "pid": 1336754, "tid": 1381179, "ts": 1295650787477.327, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787479.131, "dur": 3.367, "args": { "External id": 18600,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787479.752, "dur": 2.315, "args": { "External id": 18601,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787481.608, "dur": 0.360, "args": { "External id": 18602,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787483.361, "dur": 28.656, "args": { "External id": 18603,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787515.312, "dur": 3.786, "args": { "External id": 18604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787515.799, "dur": 2.774, "args": { "External id": 18605,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787517.768, "dur": 0.693, "args": { "External id": 18606,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787520.106, "dur": 4.909, "args": { "External id": 18607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787521.189, "dur": 3.393, "args": { "External id": 18608,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787522.406, "dur": 2.088, "args": { "External id": 18609,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787527.436, "dur": 34.214, "args": { "External id": 18610,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1201 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787572.140, "dur": 32.237, "args": { "External id": 18611,"Record function id": 0, "Sequence number": 246638, "Fwd thread id": 1, "Ev Idx": 1202 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787573.199, "dur": 3.976, "args": { "External id": 18612,"Sequence number": 246638, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1203 } }, { "ph": "f", "id": 130, "pid": 1336754, "tid": 1381179, "ts": 1295650787573.199, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787574.906, "dur": 2.133, "args": { "External id": 18613,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787576.049, "dur": 0.868, "args": { "External id": 18614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650787580.071, "dur": 22.339, "args": { "External id": 18615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1206 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787607.954, "dur": 8.886, "args": { "External id": 18616,"Record function id": 0, "Sequence number": 246637, "Fwd thread id": 1, "Ev Idx": 1207 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787608.965, "dur": 6.442, "args": { "External id": 18617,"Sequence number": 246637, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1208 } }, { "ph": "f", "id": 131, "pid": 1336754, "tid": 1381179, "ts": 1295650787608.965, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787609.734, "dur": 5.456, "args": { "External id": 18618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787612.114, "dur": 2.572, "args": { "External id": 18619,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787613.963, "dur": 0.598, "args": { "External id": 18620,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787620.933, "dur": 5.279, "args": { "External id": 18621,"Record function id": 0, "Ev Idx": 1212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787622.481, "dur": 3.248, "args": { "External id": 18622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787623.493, "dur": 1.943, "args": { "External id": 18623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787624.165, "dur": 1.200, "args": { "External id": 18624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787629.554, "dur": 9.097, "args": { "External id": 18625,"Record function id": 0, "Sequence number": 246636, "Fwd thread id": 1, "Ev Idx": 1216 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787631.009, "dur": 6.194, "args": { "External id": 18626,"Sequence number": 246636, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1217 } }, { "ph": "f", "id": 132, "pid": 1336754, "tid": 1381179, "ts": 1295650787631.009, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787632.225, "dur": 4.845, "args": { "External id": 18627,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787636.022, "dur": 0.941, "args": { "External id": 18628,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787643.568, "dur": 86.787, "args": { "External id": 18629,"Record function id": 0, "Sequence number": 246635, "Fwd thread id": 1, "Ev Idx": 1220 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787644.227, "dur": 79.194, "args": { "External id": 18630,"Sequence number": 246635, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1221 } }, { "ph": "f", "id": 133, "pid": 1336754, "tid": 1381179, "ts": 1295650787644.227, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787645.827, "dur": 3.242, "args": { "External id": 18631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787646.460, "dur": 2.165, "args": { "External id": 18632,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787647.966, "dur": 0.541, "args": { "External id": 18633,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787649.882, "dur": 28.312, "args": { "External id": 18634,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787679.518, "dur": 5.948, "args": { "External id": 18635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787682.005, "dur": 2.920, "args": { "External id": 18636,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787683.547, "dur": 1.207, "args": { "External id": 18637,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787686.633, "dur": 3.413, "args": { "External id": 18638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787687.921, "dur": 1.766, "args": { "External id": 18639,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787689.310, "dur": 0.311, "args": { "External id": 18640,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650787690.650, "dur": 32.071, "args": { "External id": 18641,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1232 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787734.595, "dur": 31.055, "args": { "External id": 18642,"Record function id": 0, "Sequence number": 246634, "Fwd thread id": 1, "Ev Idx": 1233 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787735.731, "dur": 5.824, "args": { "External id": 18643,"Sequence number": 246634, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1234 } }, { "ph": "f", "id": 134, "pid": 1336754, "tid": 1381179, "ts": 1295650787735.731, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787739.023, "dur": 2.401, "args": { "External id": 18644,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787740.242, "dur": 1.086, "args": { "External id": 18645,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650787743.648, "dur": 20.266, "args": { "External id": 18646,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1237 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787769.200, "dur": 7.438, "args": { "External id": 18647,"Record function id": 0, "Sequence number": 246633, "Fwd thread id": 1, "Ev Idx": 1238 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650787770.457, "dur": 4.346, "args": { "External id": 18648,"Sequence number": 246633, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1239 } }, { "ph": "f", "id": 135, "pid": 1336754, "tid": 1381179, "ts": 1295650787770.457, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650787771.392, "dur": 3.226, "args": { "External id": 18649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650787771.865, "dur": 2.265, "args": { "External id": 18650,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650787773.510, "dur": 0.495, "args": { "External id": 18651,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787780.778, "dur": 7.119, "args": { "External id": 18652,"Record function id": 0, "Ev Idx": 1243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650787782.663, "dur": 4.766, "args": { "External id": 18653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787783.544, "dur": 3.622, "args": { "External id": 18654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650787786.329, "dur": 0.735, "args": { "External id": 18655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650787793.926, "dur": 391.413, "args": { "External id": 18656,"Record function id": 0, "Sequence number": 246632, "Fwd thread id": 1, "Ev Idx": 1247 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650787795.911, "dur": 356.838, "args": { "External id": 18657,"Sequence number": 246632, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1248 } }, { "ph": "f", "id": 136, "pid": 1336754, "tid": 1381179, "ts": 1295650787795.911, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650787824.098, "dur": 2.295, "args": { "External id": 18658,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650787825.088, "dur": 1.153, "args": { "External id": 18659,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650787840.377, "dur": 4.797, "args": { "External id": 18660,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650787853.977, "dur": 1.450, "args": { "External id": 18661,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788045.574, "dur": 2.953, "args": { "External id": 18662,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650788052.981, "dur": 38.501, "args": { "External id": 18663,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788063.771, "dur": 0.884, "args": { "External id": 18664,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650788097.306, "dur": 30.560, "args": { "External id": 18665,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650788099.345, "dur": 28.319, "args": { "External id": 18666,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788103.943, "dur": 4.776, "args": { "External id": 18667,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650788110.097, "dur": 17.050, "args": { "External id": 18668,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650788132.419, "dur": 4.257, "args": { "External id": 18669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788135.486, "dur": 1.085, "args": { "External id": 18670,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788143.328, "dur": 2.403, "args": { "External id": 18671,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788144.704, "dur": 0.867, "args": { "External id": 18672,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650788163.502, "dur": 17.287, "args": { "External id": 18673,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1264 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788197.573, "dur": 9.329, "args": { "External id": 18674,"Record function id": 0, "Ev Idx": 1265 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788200.188, "dur": 5.988, "args": { "External id": 18675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788202.261, "dur": 2.975, "args": { "External id": 18676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1267 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788203.370, "dur": 1.791, "args": { "External id": 18677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1268 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788210.851, "dur": 7.315, "args": { "External id": 18678,"Record function id": 0, "Sequence number": 246631, "Fwd thread id": 1, "Ev Idx": 1269 } }, { "ph": "X", "cat": "cpu_op", "name": "AddBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788214.089, "dur": 1.299, "args": { "External id": 18679,"Sequence number": 246631, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1270 } }, { "ph": "f", "id": 137, "pid": 1336754, "tid": 1381179, "ts": 1295650788214.089, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650788222.144, "dur": 420.254, "args": { "External id": 18680,"Record function id": 0, "Sequence number": 246630, "Fwd thread id": 1, "Ev Idx": 1271 } }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650788223.841, "dur": 408.766, "args": { "External id": 18681,"Sequence number": 246630, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1272 } }, { "ph": "f", "id": 138, "pid": 1336754, "tid": 1381179, "ts": 1295650788223.841, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788268.536, "dur": 9.922, "args": { "External id": 18682,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650788274.429, "dur": 3.689, "args": { "External id": 18683,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]", "[8192, 1]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[33554432, 8192, 1], [], []], "Input Dims": [[16, 4096, 2048], [], []], "Ev Idx": 1274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788281.642, "dur": 7.101, "args": { "External id": 18684,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788283.191, "dur": 4.956, "args": { "External id": 18685,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788287.076, "dur": 0.895, "args": { "External id": 18686,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1381179, "ts": 1295650788292.125, "dur": 89.446, "args": { "External id": 18687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8192, 1], [1, 5632], []], "Input Dims": [[65536, 2048], [5632, 2048], []], "Ev Idx": 1278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788293.066, "dur": 5.155, "args": { "External id": 18688,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 5632]], "Input Dims": [[5632, 2048]], "Ev Idx": 1279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788293.922, "dur": 3.750, "args": { "External id": 18689,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 5632], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788295.499, "dur": 2.052, "args": { "External id": 18690,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[5632, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 5632], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1381179, "ts": 1295650788299.338, "dur": 81.579, "args": { "External id": 18691,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650788300.478, "dur": 79.542, "args": { "External id": 18692,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8192, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 1283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650788387.846, "dur": 3.184, "args": { "External id": 18693,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [23068672, 5632, 1]], "Input Dims": [[65536, 5632], [16, 4096, 5632]], "Ev Idx": 1284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788389.279, "dur": 1.625, "args": { "External id": 18694,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650788423.528, "dur": 5.001, "args": { "External id": 18695,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650788430.274, "dur": 1.817, "args": { "External id": 18696,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650788433.093, "dur": 1.838, "args": { "External id": 18697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788468.432, "dur": 2.652, "args": { "External id": 18698,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788469.758, "dur": 1.179, "args": { "External id": 18699,"Record function id": 0, "Concrete Inputs": ["", "[-1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::einsum", "pid": 1336754, "tid": 1381179, "ts": 1295650788492.413, "dur": 121.547, "args": { "External id": 18700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["", "TensorList", ""], "Input Strides": [[], [[8192, 1], [5632, 1]], []], "Input Dims": [[], [[65536, 2048], [65536, 5632]], []], "Ev Idx": 1291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650788497.460, "dur": 6.510, "args": { "External id": 18701,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788501.470, "dur": 1.497, "args": { "External id": 18702,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048, 1]", "[8192, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650788505.910, "dur": 6.459, "args": { "External id": 18703,"Record function id": 0, "Concrete Inputs": ["", "[1, 2, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8192, 1, 1], []], "Input Dims": [[65536, 2048, 1], []], "Ev Idx": 1294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788509.777, "dur": 1.970, "args": { "External id": 18704,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 65536]", "[1, 1, 8192]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[65536, 2048, 1], [], [], []], "Ev Idx": 1295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1381179, "ts": 1295650788513.821, "dur": 2.718, "args": { "External id": 18705,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 1296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788515.915, "dur": 0.280, "args": { "External id": 18706,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650788517.663, "dur": 4.029, "args": { "External id": 18707,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788520.332, "dur": 0.676, "args": { "External id": 18708,"Record function id": 0, "Concrete Inputs": ["", "[1, 5632, 65536]", "[1, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1, 1], [], [], []], "Input Dims": [[65536, 5632, 1], [], [], []], "Ev Idx": 1299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650788527.824, "dur": 3.429, "args": { "External id": 18709,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 8192], []], "Input Dims": [[2048, 1, 65536], []], "Ev Idx": 1300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788530.217, "dur": 0.715, "args": { "External id": 18710,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536, 1]", "[1, 8192, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 8192], [], [], []], "Input Dims": [[2048, 1, 65536], [], [], []], "Ev Idx": 1301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788532.526, "dur": 5.522, "args": { "External id": 18711,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 8192, 1], []], "Input Dims": [[2048, 65536, 1], []], "Ev Idx": 1302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_reshape_alias", "pid": 1336754, "tid": 1381179, "ts": 1295650788535.868, "dur": 1.987, "args": { "External id": 18712,"Record function id": 0, "Concrete Inputs": ["", "[1, 2048, 65536]", "[2048, 1, 8192]"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList"], "Input Strides": [[1, 8192, 1], [], []], "Input Dims": [[2048, 65536, 1], [], []], "Ev Idx": 1303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650788539.028, "dur": 3.035, "args": { "External id": 18713,"Record function id": 0, "Concrete Inputs": ["", "[2, 1, 0]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1, 1, 5632], []], "Input Dims": [[1, 5632, 65536], []], "Ev Idx": 1304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788541.515, "dur": 0.262, "args": { "External id": 18714,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632, 1]", "[5632, 1, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1, 5632], [], [], []], "Input Dims": [[1, 5632, 65536], [], [], []], "Ev Idx": 1305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788543.318, "dur": 4.861, "args": { "External id": 18715,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788544.467, "dur": 3.623, "args": { "External id": 18716,"Record function id": 0, "Concrete Inputs": ["", "[1, 65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 1], []], "Input Dims": [[65536, 5632, 1], []], "Ev Idx": 1307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650788549.243, "dur": 51.496, "args": { "External id": 18717,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1, 8192], [369098752, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632]], "Ev Idx": 1308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788602.874, "dur": 2.062, "args": { "External id": 18718,"Record function id": 0, "Concrete Inputs": ["", "[2048, 1, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[11534336, 5632, 1], []], "Input Dims": [[1, 2048, 5632], []], "Ev Idx": 1309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::permute", "pid": 1336754, "tid": 1381179, "ts": 1295650788605.945, "dur": 3.565, "args": { "External id": 18719,"Record function id": 0, "Concrete Inputs": ["", "[0, 2, 1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 5632, 1], []], "Input Dims": [[2048, 1, 5632], []], "Ev Idx": 1310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788608.347, "dur": 0.587, "args": { "External id": 18720,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632, 1]", "[5632, 1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 5632, 1], [], [], []], "Input Dims": [[2048, 1, 5632], [], [], []], "Ev Idx": 1311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788611.968, "dur": 0.977, "args": { "External id": 18721,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1, 5632], []], "Input Dims": [[2048, 5632, 1], []], "Ev Idx": 1312 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788652.559, "dur": 9.535, "args": { "External id": 18722,"Record function id": 0, "Ev Idx": 1313 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788655.370, "dur": 6.068, "args": { "External id": 18723,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788657.189, "dur": 3.396, "args": { "External id": 18724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1315 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788658.277, "dur": 2.178, "args": { "External id": 18725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1316 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788666.211, "dur": 8.116, "args": { "External id": 18726,"Record function id": 0, "Sequence number": 246629, "Fwd thread id": 1, "Ev Idx": 1317 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788667.686, "dur": 4.481, "args": { "External id": 18727,"Sequence number": 246629, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1318 } }, { "ph": "f", "id": 139, "pid": 1336754, "tid": 1381179, "ts": 1295650788667.686, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788669.649, "dur": 2.344, "args": { "External id": 18728,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788671.104, "dur": 0.770, "args": { "External id": 18729,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1320 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788677.820, "dur": 118.177, "args": { "External id": 18730,"Record function id": 0, "Sequence number": 246628, "Fwd thread id": 1, "Ev Idx": 1321 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788678.805, "dur": 111.725, "args": { "External id": 18731,"Sequence number": 246628, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1322 } }, { "ph": "f", "id": 140, "pid": 1336754, "tid": 1381179, "ts": 1295650788678.805, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788683.340, "dur": 4.453, "args": { "External id": 18732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788684.595, "dur": 2.627, "args": { "External id": 18733,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788686.583, "dur": 0.468, "args": { "External id": 18734,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650788688.731, "dur": 40.371, "args": { "External id": 18735,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788730.228, "dur": 6.583, "args": { "External id": 18736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788731.317, "dur": 4.826, "args": { "External id": 18737,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788735.040, "dur": 0.937, "args": { "External id": 18738,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788738.379, "dur": 3.313, "args": { "External id": 18739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788739.525, "dur": 1.721, "args": { "External id": 18740,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788740.780, "dur": 0.382, "args": { "External id": 18741,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650788742.091, "dur": 47.555, "args": { "External id": 18742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788800.670, "dur": 8.524, "args": { "External id": 18743,"Record function id": 0, "Sequence number": 246627, "Fwd thread id": 1, "Ev Idx": 1334 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788801.694, "dur": 5.873, "args": { "External id": 18744,"Sequence number": 246627, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1335 } }, { "ph": "f", "id": 141, "pid": 1336754, "tid": 1381179, "ts": 1295650788801.694, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788803.374, "dur": 4.056, "args": { "External id": 18745,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788806.352, "dur": 0.958, "args": { "External id": 18746,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788812.678, "dur": 6.890, "args": { "External id": 18747,"Record function id": 0, "Sequence number": 246626, "Fwd thread id": 1, "Ev Idx": 1338 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788813.551, "dur": 4.372, "args": { "External id": 18748,"Sequence number": 246626, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1339 } }, { "ph": "f", "id": 142, "pid": 1336754, "tid": 1381179, "ts": 1295650788813.551, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788814.442, "dur": 3.271, "args": { "External id": 18749,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788814.957, "dur": 2.295, "args": { "External id": 18750,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788816.772, "dur": 0.371, "args": { "External id": 18751,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1342 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788823.426, "dur": 5.273, "args": { "External id": 18752,"Record function id": 0, "Ev Idx": 1343 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650788825.585, "dur": 2.647, "args": { "External id": 18753,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788826.474, "dur": 1.539, "args": { "External id": 18754,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1345 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650788827.051, "dur": 0.877, "args": { "External id": 18755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1346 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788832.147, "dur": 8.313, "args": { "External id": 18756,"Record function id": 0, "Sequence number": 246625, "Fwd thread id": 1, "Ev Idx": 1347 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788833.538, "dur": 5.187, "args": { "External id": 18757,"Sequence number": 246625, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[23068672, 5632, 1]], "Input Dims": [[16, 4096, 5632]], "Ev Idx": 1348 } }, { "ph": "f", "id": 143, "pid": 1336754, "tid": 1381179, "ts": 1295650788833.538, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788837.172, "dur": 1.412, "args": { "External id": 18758,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788837.785, "dur": 0.683, "args": { "External id": 18759,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 1350 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788843.428, "dur": 106.643, "args": { "External id": 18760,"Record function id": 0, "Sequence number": 246624, "Fwd thread id": 1, "Ev Idx": 1351 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788844.080, "dur": 99.513, "args": { "External id": 18761,"Sequence number": 246624, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1352 } }, { "ph": "f", "id": 144, "pid": 1336754, "tid": 1381179, "ts": 1295650788844.080, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788845.801, "dur": 4.464, "args": { "External id": 18762,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[65536, 5632]], "Ev Idx": 1353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788846.303, "dur": 3.496, "args": { "External id": 18763,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[65536, 5632], [], []], "Ev Idx": 1354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788849.303, "dur": 0.375, "args": { "External id": 18764,"Record function id": 0, "Concrete Inputs": ["", "[5632, 65536]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[65536, 5632], [], [], []], "Ev Idx": 1355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650788851.037, "dur": 31.824, "args": { "External id": 18765,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048]], "Ev Idx": 1356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788883.942, "dur": 3.636, "args": { "External id": 18766,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788884.554, "dur": 2.481, "args": { "External id": 18767,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 1358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788886.355, "dur": 0.543, "args": { "External id": 18768,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 1359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650788888.601, "dur": 6.307, "args": { "External id": 18769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650788889.760, "dur": 4.742, "args": { "External id": 18770,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650788892.795, "dur": 1.642, "args": { "External id": 18771,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650788895.313, "dur": 47.521, "args": { "External id": 18772,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 1363 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788956.800, "dur": 79.273, "args": { "External id": 18773,"Record function id": 0, "Sequence number": 246623, "Fwd thread id": 1, "Ev Idx": 1364 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650788957.767, "dur": 4.811, "args": { "External id": 18774,"Sequence number": 246623, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1365 } }, { "ph": "f", "id": 145, "pid": 1336754, "tid": 1381179, "ts": 1295650788957.767, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650788959.934, "dur": 2.496, "args": { "External id": 18775,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650788961.265, "dur": 1.071, "args": { "External id": 18776,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650788965.313, "dur": 66.245, "args": { "External id": 18777,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789042.155, "dur": 11.512, "args": { "External id": 18778,"Record function id": 0, "Sequence number": 246622, "Fwd thread id": 1, "Ev Idx": 1369 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789043.487, "dur": 8.374, "args": { "External id": 18779,"Sequence number": 246622, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1370 } }, { "ph": "f", "id": 146, "pid": 1336754, "tid": 1381179, "ts": 1295650789043.487, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650789044.641, "dur": 6.983, "args": { "External id": 18780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 5632]], "Ev Idx": 1371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650789047.677, "dur": 3.245, "args": { "External id": 18781,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 1372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789049.952, "dur": 0.843, "args": { "External id": 18782,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 1373 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789057.903, "dur": 6.122, "args": { "External id": 18783,"Record function id": 0, "Ev Idx": 1374 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789059.763, "dur": 3.692, "args": { "External id": 18784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789061.272, "dur": 1.895, "args": { "External id": 18785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1376 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789061.832, "dur": 1.225, "args": { "External id": 18786,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1377 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650789068.952, "dur": 433.386, "args": { "External id": 18787,"Record function id": 0, "Sequence number": 246621, "Fwd thread id": 1, "Ev Idx": 1378 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650789074.813, "dur": 393.985, "args": { "External id": 18788,"Sequence number": 246621, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 1379 } }, { "ph": "f", "id": 147, "pid": 1336754, "tid": 1381179, "ts": 1295650789074.813, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1381179, "ts": 1295650789099.199, "dur": 38.056, "args": { "External id": 18789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650789100.644, "dur": 36.412, "args": { "External id": 18790,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650789103.516, "dur": 6.776, "args": { "External id": 18791,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], [], []], "Ev Idx": 1382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650789106.367, "dur": 3.321, "args": { "External id": 18792,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650789111.446, "dur": 25.129, "args": { "External id": 18793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789149.576, "dur": 2.937, "args": { "External id": 18794,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789150.756, "dur": 1.658, "args": { "External id": 18795,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789156.260, "dur": 2.976, "args": { "External id": 18796,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789157.046, "dur": 2.104, "args": { "External id": 18797,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650789173.439, "dur": 2.392, "args": { "External id": 18798,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650789185.921, "dur": 3.371, "args": { "External id": 18799,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789356.302, "dur": 3.709, "args": { "External id": 18800,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650789364.425, "dur": 34.614, "args": { "External id": 18801,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789374.210, "dur": 0.881, "args": { "External id": 18802,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650789404.784, "dur": 29.787, "args": { "External id": 18803,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650789406.582, "dur": 27.792, "args": { "External id": 18804,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789410.730, "dur": 3.793, "args": { "External id": 18805,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650789418.015, "dur": 15.866, "args": { "External id": 18806,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650789439.214, "dur": 2.697, "args": { "External id": 18807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789440.564, "dur": 1.245, "args": { "External id": 18808,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789448.952, "dur": 2.761, "args": { "External id": 18809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789450.328, "dur": 1.226, "args": { "External id": 18810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789453.863, "dur": 4.251, "args": { "External id": 18811,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789455.161, "dur": 2.857, "args": { "External id": 18812,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650789483.096, "dur": 17.753, "args": { "External id": 18813,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1404 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789513.983, "dur": 8.780, "args": { "External id": 18814,"Record function id": 0, "Ev Idx": 1405 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789516.366, "dur": 5.700, "args": { "External id": 18815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789518.353, "dur": 2.811, "args": { "External id": 18816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1407 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789519.465, "dur": 1.607, "args": { "External id": 18817,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1408 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789526.367, "dur": 10.043, "args": { "External id": 18818,"Record function id": 0, "Sequence number": 246620, "Fwd thread id": 1, "Ev Idx": 1409 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789528.132, "dur": 5.773, "args": { "External id": 18819,"Sequence number": 246620, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1410 } }, { "ph": "f", "id": 148, "pid": 1336754, "tid": 1381179, "ts": 1295650789528.132, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789529.919, "dur": 3.826, "args": { "External id": 18820,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789532.569, "dur": 1.048, "args": { "External id": 18821,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1412 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789539.892, "dur": 128.049, "args": { "External id": 18822,"Record function id": 0, "Sequence number": 246619, "Fwd thread id": 1, "Ev Idx": 1413 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789540.769, "dur": 121.699, "args": { "External id": 18823,"Sequence number": 246619, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1414 } }, { "ph": "f", "id": 149, "pid": 1336754, "tid": 1381179, "ts": 1295650789540.769, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650789543.068, "dur": 4.786, "args": { "External id": 18824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650789544.410, "dur": 2.933, "args": { "External id": 18825,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789546.426, "dur": 0.725, "args": { "External id": 18826,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650789548.995, "dur": 57.391, "args": { "External id": 18827,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650789609.655, "dur": 4.660, "args": { "External id": 18828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650789610.481, "dur": 3.276, "args": { "External id": 18829,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789612.046, "dur": 1.546, "args": { "External id": 18830,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650789615.654, "dur": 3.907, "args": { "External id": 18831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650789616.798, "dur": 2.323, "args": { "External id": 18832,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789618.635, "dur": 0.387, "args": { "External id": 18833,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650789621.982, "dur": 39.590, "args": { "External id": 18834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1425 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789672.919, "dur": 8.413, "args": { "External id": 18835,"Record function id": 0, "Sequence number": 246618, "Fwd thread id": 1, "Ev Idx": 1426 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789673.872, "dur": 5.805, "args": { "External id": 18836,"Sequence number": 246618, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1427 } }, { "ph": "f", "id": 150, "pid": 1336754, "tid": 1381179, "ts": 1295650789673.872, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789675.895, "dur": 3.631, "args": { "External id": 18837,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789677.177, "dur": 2.238, "args": { "External id": 18838,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1429 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789684.634, "dur": 9.964, "args": { "External id": 18839,"Record function id": 0, "Sequence number": 246617, "Fwd thread id": 1, "Ev Idx": 1430 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789685.652, "dur": 7.060, "args": { "External id": 18840,"Sequence number": 246617, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1431 } }, { "ph": "f", "id": 151, "pid": 1336754, "tid": 1381179, "ts": 1295650789685.652, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650789686.668, "dur": 5.824, "args": { "External id": 18841,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650789687.317, "dur": 4.629, "args": { "External id": 18842,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789691.164, "dur": 0.682, "args": { "External id": 18843,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1434 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789698.650, "dur": 4.959, "args": { "External id": 18844,"Record function id": 0, "Ev Idx": 1435 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650789700.346, "dur": 2.754, "args": { "External id": 18845,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789701.286, "dur": 1.581, "args": { "External id": 18846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1437 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650789701.908, "dur": 0.875, "args": { "External id": 18847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1438 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789706.489, "dur": 5.629, "args": { "External id": 18848,"Record function id": 0, "Sequence number": 246616, "Fwd thread id": 1, "Ev Idx": 1439 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650789707.326, "dur": 3.276, "args": { "External id": 18849,"Sequence number": 246616, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1440 } }, { "ph": "f", "id": 152, "pid": 1336754, "tid": 1381179, "ts": 1295650789707.326, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650789708.556, "dur": 1.889, "args": { "External id": 18850,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650789709.252, "dur": 1.063, "args": { "External id": 18851,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1442 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650789716.389, "dur": 265.277, "args": { "External id": 18852,"Record function id": 0, "Sequence number": 246615, "Fwd thread id": 1, "Ev Idx": 1443 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFuncBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650789717.799, "dur": 248.999, "args": { "External id": 18853,"Sequence number": 246615, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1444 } }, { "ph": "f", "id": 153, "pid": 1336754, "tid": 1381179, "ts": 1295650789717.799, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650789731.468, "dur": 6.466, "args": { "External id": 18854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789734.247, "dur": 3.203, "args": { "External id": 18855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650789739.803, "dur": 4.298, "args": { "External id": 18856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789741.776, "dur": 2.143, "args": { "External id": 18857,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650789745.420, "dur": 3.626, "args": { "External id": 18858,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650789747.256, "dur": 1.597, "args": { "External id": 18859,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1450 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650789771.561, "dur": 171.067, "args": { "External id": 18860,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650789847.227, "dur": 4.040, "args": { "External id": 18861,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650789853.075, "dur": 4.080, "args": { "External id": 18862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650789954.646, "dur": 3.414, "args": { "External id": 18863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650789961.047, "dur": 0.641, "args": { "External id": 18864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1381179, "ts": 1295650789963.460, "dur": 0.904, "args": { "External id": 18865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1456 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650790032.639, "dur": 258.509, "args": { "External id": 18866,"Record function id": 0, "Sequence number": 246614, "Fwd thread id": 1, "Ev Idx": 1457 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650790035.464, "dur": 247.351, "args": { "External id": 18867,"Sequence number": 246614, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1458 } }, { "ph": "f", "id": 154, "pid": 1336754, "tid": 1381179, "ts": 1295650790035.464, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650790056.341, "dur": 53.225, "args": { "External id": 18868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790059.916, "dur": 4.439, "args": { "External id": 18869,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650790066.169, "dur": 42.888, "args": { "External id": 18870,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650790119.523, "dur": 4.565, "args": { "External id": 18871,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790121.403, "dur": 2.306, "args": { "External id": 18872,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1463 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650790300.738, "dur": 161.307, "args": { "External id": 18873,"Record function id": 0, "Sequence number": 246613, "Fwd thread id": 1, "Ev Idx": 1464 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650790303.118, "dur": 153.115, "args": { "External id": 18874,"Sequence number": 246613, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1465 } }, { "ph": "f", "id": 155, "pid": 1336754, "tid": 1381179, "ts": 1295650790303.118, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1381179, "ts": 1295650790316.460, "dur": 37.546, "args": { "External id": 18875,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790319.548, "dur": 3.681, "args": { "External id": 18876,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650790324.173, "dur": 29.308, "args": { "External id": 18877,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], []], "Ev Idx": 1468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1381179, "ts": 1295650790361.543, "dur": 5.037, "args": { "External id": 18878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 1469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790363.745, "dur": 2.360, "args": { "External id": 18879,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790467.956, "dur": 15.116, "args": { "External id": 18880,"Record function id": 0, "Sequence number": 246612, "Fwd thread id": 1, "Ev Idx": 1471 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790469.476, "dur": 11.467, "args": { "External id": 18881,"Sequence number": 246612, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1472 } }, { "ph": "f", "id": 156, "pid": 1336754, "tid": 1381179, "ts": 1295650790469.476, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790472.036, "dur": 8.636, "args": { "External id": 18882,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790473.620, "dur": 6.853, "args": { "External id": 18883,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790486.625, "dur": 7.055, "args": { "External id": 18884,"Record function id": 0, "Sequence number": 246611, "Fwd thread id": 1, "Ev Idx": 1475 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790487.983, "dur": 3.808, "args": { "External id": 18885,"Sequence number": 246611, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1476 } }, { "ph": "f", "id": 157, "pid": 1336754, "tid": 1381179, "ts": 1295650790487.983, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790489.496, "dur": 2.153, "args": { "External id": 18886,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790490.602, "dur": 0.945, "args": { "External id": 18887,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790496.801, "dur": 8.022, "args": { "External id": 18888,"Record function id": 0, "Sequence number": 246610, "Fwd thread id": 1, "Ev Idx": 1479 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790497.700, "dur": 5.805, "args": { "External id": 18889,"Sequence number": 246610, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 1480 } }, { "ph": "f", "id": 158, "pid": 1336754, "tid": 1381179, "ts": 1295650790497.700, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790501.353, "dur": 2.016, "args": { "External id": 18890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790502.491, "dur": 0.755, "args": { "External id": 18891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 1482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790508.289, "dur": 6.499, "args": { "External id": 18892,"Record function id": 0, "Sequence number": 246609, "Fwd thread id": 1, "Ev Idx": 1483 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790509.698, "dur": 3.222, "args": { "External id": 18893,"Sequence number": 246609, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1484 } }, { "ph": "f", "id": 159, "pid": 1336754, "tid": 1381179, "ts": 1295650790509.698, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790510.839, "dur": 1.940, "args": { "External id": 18894,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790511.835, "dur": 0.847, "args": { "External id": 18895,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790518.091, "dur": 145.087, "args": { "External id": 18896,"Record function id": 0, "Sequence number": 246608, "Fwd thread id": 1, "Ev Idx": 1487 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790519.113, "dur": 137.921, "args": { "External id": 18897,"Sequence number": 246608, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1488 } }, { "ph": "f", "id": 160, "pid": 1336754, "tid": 1381179, "ts": 1295650790519.113, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790522.324, "dur": 8.798, "args": { "External id": 18898,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790526.030, "dur": 4.454, "args": { "External id": 18899,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790528.494, "dur": 1.735, "args": { "External id": 18900,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790532.426, "dur": 65.818, "args": { "External id": 18901,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790599.729, "dur": 5.284, "args": { "External id": 18902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790600.757, "dur": 3.536, "args": { "External id": 18903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790602.689, "dur": 1.463, "args": { "External id": 18904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790606.561, "dur": 6.103, "args": { "External id": 18905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790609.581, "dur": 2.630, "args": { "External id": 18906,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790611.585, "dur": 0.547, "args": { "External id": 18907,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790613.192, "dur": 43.137, "args": { "External id": 18908,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1499 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790667.799, "dur": 7.128, "args": { "External id": 18909,"Record function id": 0, "Sequence number": 246607, "Fwd thread id": 1, "Ev Idx": 1500 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790668.808, "dur": 4.563, "args": { "External id": 18910,"Sequence number": 246607, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1501 } }, { "ph": "f", "id": 161, "pid": 1336754, "tid": 1381179, "ts": 1295650790668.808, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790670.509, "dur": 2.712, "args": { "External id": 18911,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790671.945, "dur": 1.117, "args": { "External id": 18912,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1503 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790678.157, "dur": 9.580, "args": { "External id": 18913,"Record function id": 0, "Sequence number": 246606, "Fwd thread id": 1, "Ev Idx": 1504 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790679.127, "dur": 6.609, "args": { "External id": 18914,"Sequence number": 246606, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1505 } }, { "ph": "f", "id": 162, "pid": 1336754, "tid": 1381179, "ts": 1295650790679.127, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790682.081, "dur": 3.415, "args": { "External id": 18915,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790682.844, "dur": 2.132, "args": { "External id": 18916,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790684.427, "dur": 0.436, "args": { "External id": 18917,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1508 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650790693.942, "dur": 9.611, "args": { "External id": 18918,"Record function id": 0, "Ev Idx": 1509 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650790695.899, "dur": 6.909, "args": { "External id": 18919,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650790698.299, "dur": 4.174, "args": { "External id": 18920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1511 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650790699.896, "dur": 2.488, "args": { "External id": 18921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1512 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790707.132, "dur": 8.906, "args": { "External id": 18922,"Record function id": 0, "Sequence number": 246605, "Fwd thread id": 1, "Ev Idx": 1513 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790708.456, "dur": 4.983, "args": { "External id": 18923,"Sequence number": 246605, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1514 } }, { "ph": "f", "id": 163, "pid": 1336754, "tid": 1381179, "ts": 1295650790708.456, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790709.552, "dur": 3.728, "args": { "External id": 18924,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790712.500, "dur": 0.632, "args": { "External id": 18925,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1516 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790718.925, "dur": 86.311, "args": { "External id": 18926,"Record function id": 0, "Sequence number": 246604, "Fwd thread id": 1, "Ev Idx": 1517 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790719.874, "dur": 80.498, "args": { "External id": 18927,"Sequence number": 246604, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1518 } }, { "ph": "f", "id": 164, "pid": 1336754, "tid": 1381179, "ts": 1295650790719.874, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790721.628, "dur": 3.163, "args": { "External id": 18928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790722.342, "dur": 1.832, "args": { "External id": 18929,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790723.578, "dur": 0.456, "args": { "External id": 18930,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790725.417, "dur": 27.903, "args": { "External id": 18931,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790756.579, "dur": 3.807, "args": { "External id": 18932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790757.098, "dur": 2.820, "args": { "External id": 18933,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790758.817, "dur": 0.989, "args": { "External id": 18934,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790761.282, "dur": 4.341, "args": { "External id": 18935,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790762.084, "dur": 3.077, "args": { "External id": 18936,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790763.364, "dur": 1.728, "args": { "External id": 18937,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790767.841, "dur": 31.846, "args": { "External id": 18938,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790811.415, "dur": 35.506, "args": { "External id": 18939,"Record function id": 0, "Sequence number": 246603, "Fwd thread id": 1, "Ev Idx": 1530 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790812.419, "dur": 7.356, "args": { "External id": 18940,"Sequence number": 246603, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1531 } }, { "ph": "f", "id": 165, "pid": 1336754, "tid": 1381179, "ts": 1295650790812.419, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790814.354, "dur": 5.270, "args": { "External id": 18941,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790818.518, "dur": 1.006, "args": { "External id": 18942,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1381179, "ts": 1295650790822.709, "dur": 22.084, "args": { "External id": 18943,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1534 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790850.531, "dur": 30.836, "args": { "External id": 18944,"Record function id": 0, "Sequence number": 246602, "Fwd thread id": 1, "Ev Idx": 1535 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790872.303, "dur": 6.667, "args": { "External id": 18945,"Sequence number": 246602, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1536 } }, { "ph": "f", "id": 166, "pid": 1336754, "tid": 1381179, "ts": 1295650790872.303, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790875.547, "dur": 3.205, "args": { "External id": 18946,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790876.183, "dur": 2.035, "args": { "External id": 18947,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790877.613, "dur": 0.473, "args": { "External id": 18948,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1539 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650790885.392, "dur": 4.549, "args": { "External id": 18949,"Record function id": 0, "Ev Idx": 1540 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650790886.916, "dur": 2.542, "args": { "External id": 18950,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650790887.765, "dur": 1.457, "args": { "External id": 18951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1542 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650790888.235, "dur": 0.873, "args": { "External id": 18952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1543 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790893.375, "dur": 8.328, "args": { "External id": 18953,"Record function id": 0, "Sequence number": 246601, "Fwd thread id": 1, "Ev Idx": 1544 } }, { "ph": "X", "cat": "cpu_op", "name": "UnsafeViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790894.697, "dur": 5.284, "args": { "External id": 18954,"Sequence number": 246601, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1545 } }, { "ph": "f", "id": 167, "pid": 1336754, "tid": 1381179, "ts": 1295650790894.697, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650790895.692, "dur": 4.160, "args": { "External id": 18955,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650790898.910, "dur": 0.841, "args": { "External id": 18956,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1547 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790904.920, "dur": 131.946, "args": { "External id": 18957,"Record function id": 0, "Sequence number": 246600, "Fwd thread id": 1, "Ev Idx": 1548 } }, { "ph": "X", "cat": "cpu_op", "name": "MmBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650790905.550, "dur": 122.555, "args": { "External id": 18958,"Sequence number": 246600, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1549 } }, { "ph": "f", "id": 168, "pid": 1336754, "tid": 1381179, "ts": 1295650790905.550, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790907.600, "dur": 2.802, "args": { "External id": 18959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790908.081, "dur": 1.827, "args": { "External id": 18960,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[65536, 2048], [], []], "Ev Idx": 1551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790909.440, "dur": 0.374, "args": { "External id": 18961,"Record function id": 0, "Concrete Inputs": ["", "[2048, 65536]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 1552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790910.950, "dur": 31.174, "args": { "External id": 18962,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048]], "Ev Idx": 1553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790944.877, "dur": 3.435, "args": { "External id": 18963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790945.326, "dur": 2.352, "args": { "External id": 18964,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790947.138, "dur": 0.421, "args": { "External id": 18965,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650790949.254, "dur": 3.285, "args": { "External id": 18966,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650790950.283, "dur": 1.838, "args": { "External id": 18967,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650790951.805, "dur": 0.219, "args": { "External id": 18968,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650790955.242, "dur": 71.321, "args": { "External id": 18969,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 1560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650791043.916, "dur": 28.977, "args": { "External id": 18970,"Record function id": 0, "Sequence number": 246599, "Fwd thread id": 1, "Ev Idx": 1561 } }, { "ph": "X", "cat": "cpu_op", "name": "ViewBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650791044.980, "dur": 4.526, "args": { "External id": 18971,"Sequence number": 246599, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 1562 } }, { "ph": "f", "id": 169, "pid": 1336754, "tid": 1381179, "ts": 1295650791044.980, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650791046.580, "dur": 2.760, "args": { "External id": 18972,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650791047.496, "dur": 1.733, "args": { "External id": 18973,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650791051.926, "dur": 18.928, "args": { "External id": 18974,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1565 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650791076.362, "dur": 9.049, "args": { "External id": 18975,"Record function id": 0, "Sequence number": 246598, "Fwd thread id": 1, "Ev Idx": 1566 } }, { "ph": "X", "cat": "cpu_op", "name": "TBackward0", "pid": 1336754, "tid": 1381179, "ts": 1295650791077.189, "dur": 6.464, "args": { "External id": 18976,"Sequence number": 246598, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1567 } }, { "ph": "f", "id": 170, "pid": 1336754, "tid": 1381179, "ts": 1295650791077.189, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1381179, "ts": 1295650791077.836, "dur": 5.609, "args": { "External id": 18977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1, 2048]], "Input Dims": [[2048, 2048]], "Ev Idx": 1568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1381179, "ts": 1295650791078.705, "dur": 4.102, "args": { "External id": 18978,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[1, 2048], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 1569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791082.086, "dur": 0.605, "args": { "External id": 18979,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[2048, 1]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 2048], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 1570 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650791089.658, "dur": 5.796, "args": { "External id": 18980,"Record function id": 0, "Ev Idx": 1571 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650791091.485, "dur": 3.459, "args": { "External id": 18981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650791092.597, "dur": 2.043, "args": { "External id": 18982,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1573 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650791093.153, "dur": 1.403, "args": { "External id": 18983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1574 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650791099.751, "dur": 366.817, "args": { "External id": 18984,"Record function id": 0, "Sequence number": 246597, "Fwd thread id": 1, "Ev Idx": 1575 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650791101.686, "dur": 330.688, "args": { "External id": 18985,"Sequence number": 246597, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1576 } }, { "ph": "f", "id": 171, "pid": 1336754, "tid": 1381179, "ts": 1295650791101.686, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650791133.235, "dur": 2.122, "args": { "External id": 18986,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650791134.117, "dur": 1.125, "args": { "External id": 18987,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 1578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650791150.788, "dur": 5.299, "args": { "External id": 18988,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650791165.230, "dur": 1.924, "args": { "External id": 18989,"Record function id": 0, "Concrete Inputs": ["[132, 2048]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650791330.131, "dur": 2.623, "args": { "External id": 18990,"Record function id": 0, "Concrete Inputs": ["", "[1, -1, 2048]"], "Input type": ["float", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[132, 2048], []], "Ev Idx": 1581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1381179, "ts": 1295650791336.869, "dur": 36.606, "args": { "External id": 18991,"Record function id": 0, "Concrete Inputs": ["", "[1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[270336, 2048, 1], [], [], []], "Input Dims": [[1, 132, 2048], [], [], []], "Ev Idx": 1582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791347.530, "dur": 0.673, "args": { "External id": 18992,"Record function id": 0, "Concrete Inputs": ["", "[1, 1, 2048]", "[2048, 0, 1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[1, 2048], [], [], []], "Ev Idx": 1583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650791378.805, "dur": 31.784, "args": { "External id": 18993,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], []], "Ev Idx": 1584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650791380.409, "dur": 29.980, "args": { "External id": 18994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[1, 2048], [], [], [], [], [], []], "Ev Idx": 1585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791384.749, "dur": 4.153, "args": { "External id": 18995,"Record function id": 0, "Concrete Inputs": ["[1, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650791392.624, "dur": 17.285, "args": { "External id": 18996,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[1, 2048], [1, 2048], []], "Ev Idx": 1587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1381179, "ts": 1295650791414.859, "dur": 2.862, "args": { "External id": 18997,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1]], "Input Dims": [[1, 2048], [2048]], "Ev Idx": 1588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650791416.449, "dur": 1.177, "args": { "External id": 18998,"Record function id": 0, "Concrete Inputs": ["", "[2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[1, 2048], []], "Ev Idx": 1589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1381179, "ts": 1295650791423.792, "dur": 1.846, "args": { "External id": 18999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650791424.693, "dur": 0.862, "args": { "External id": 19000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 1591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1381179, "ts": 1295650791445.030, "dur": 16.474, "args": { "External id": 19001,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 1592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650791477.390, "dur": 10.345, "args": { "External id": 19002,"Record function id": 0, "Ev Idx": 1593 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650791480.005, "dur": 6.987, "args": { "External id": 19003,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650791481.689, "dur": 4.346, "args": { "External id": 19004,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1595 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650791484.421, "dur": 1.513, "args": { "External id": 19005,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1596 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650791492.367, "dur": 2597.841, "args": { "External id": 19006,"Record function id": 0, "Ev Idx": 1597 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.27)", "pid": 1336754, "tid": 1381179, "ts": 1295650791521.859, "dur": 872.079, "args": { "External id": 19007,"Record function id": 0, "Ev Idx": 1598 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.26", "pid": 1336754, "tid": 1381179, "ts": 1295650791545.620, "dur": 839.031, "args": { "External id": 19008,"Record function id": 0, "Ev Idx": 1599 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650791558.360, "dur": 810.952, "args": { "External id": 19009,"Record function id": 0, "Ev Idx": 1600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650791633.292, "dur": 5.873, "args": { "External id": 19010,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295650791655.004, "dur": 28.078, "args": { "External id": 19011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791659.255, "dur": 1.123, "args": { "External id": 19012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791662.412, "dur": 1.430, "args": { "External id": 19013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791665.876, "dur": 0.353, "args": { "External id": 19014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791667.716, "dur": 0.176, "args": { "External id": 19015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791669.179, "dur": 0.251, "args": { "External id": 19016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791670.873, "dur": 0.383, "args": { "External id": 19017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791672.847, "dur": 0.691, "args": { "External id": 19018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791675.513, "dur": 0.423, "args": { "External id": 19019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791677.739, "dur": 0.416, "args": { "External id": 19020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650791698.840, "dur": 33.453, "args": { "External id": 19021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1612 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295650791767.346, "dur": 107.293, "args": { "External id": 19022,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650791777.772, "dur": 5.666, "args": { "External id": 19023,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295650791788.481, "dur": 10.064, "args": { "External id": 19024,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650791792.264, "dur": 5.922, "args": { "External id": 19025,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791796.372, "dur": 0.603, "args": { "External id": 19026,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295650791805.703, "dur": 25.628, "args": { "External id": 19027,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791808.035, "dur": 0.470, "args": { "External id": 19028,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791810.561, "dur": 0.404, "args": { "External id": 19029,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791812.775, "dur": 0.535, "args": { "External id": 19030,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791814.884, "dur": 0.368, "args": { "External id": 19031,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791816.910, "dur": 0.343, "args": { "External id": 19032,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791818.769, "dur": 0.366, "args": { "External id": 19033,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791820.672, "dur": 1.141, "args": { "External id": 19034,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791823.843, "dur": 0.358, "args": { "External id": 19035,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650791826.209, "dur": 0.556, "args": { "External id": 19036,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650791842.090, "dur": 24.772, "args": { "External id": 19037,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1628 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295650791928.142, "dur": 340.426, "args": { "External id": 19038,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1629 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650791955.282, "dur": 307.869, "args": { "External id": 19039,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1630, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295650791965.866, "dur": 290.927, "args": { "External id": 19040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1631 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650792292.171, "dur": 2.792, "args": { "External id": 19041,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1632, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650792401.217, "dur": 1669.021, "args": { "External id": 19042,"Sequence number": 246596, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1633 } }, { "ph": "f", "id": 172, "pid": 1336754, "tid": 1381179, "ts": 1295650792401.217, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650792516.065, "dur": 108.207, "args": { "External id": 19043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1634 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295650792665.522, "dur": 41.029, "args": { "External id": 19044,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650792725.475, "dur": 47.264, "args": { "External id": 19045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650792781.629, "dur": 33.051, "args": { "External id": 19046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650792820.857, "dur": 44.090, "args": { "External id": 19047,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650792872.438, "dur": 29.995, "args": { "External id": 19048,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650792909.773, "dur": 42.283, "args": { "External id": 19049,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295650792975.964, "dur": 61.824, "args": { "External id": 19050,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1641 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295650793060.712, "dur": 32.375, "args": { "External id": 19051,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1642 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295650793117.990, "dur": 22.128, "args": { "External id": 19052,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1643 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295650793156.285, "dur": 17.801, "args": { "External id": 19053,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793185.931, "dur": 38.827, "args": { "External id": 19054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793245.186, "dur": 42.404, "args": { "External id": 19055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1646 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650793319.812, "dur": 179.569, "args": { "External id": 19056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650793401.945, "dur": 5.327, "args": { "External id": 19057,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650793409.434, "dur": 2.759, "args": { "External id": 19058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1649 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295650793531.192, "dur": 27.567, "args": { "External id": 19059,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1650 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295650793571.357, "dur": 15.825, "args": { "External id": 19060,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793596.057, "dur": 40.949, "args": { "External id": 19061,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793643.867, "dur": 36.170, "args": { "External id": 19062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793687.140, "dur": 23.687, "args": { "External id": 19063,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793717.278, "dur": 31.003, "args": { "External id": 19064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793755.201, "dur": 22.756, "args": { "External id": 19065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650793785.992, "dur": 31.461, "args": { "External id": 19066,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1657 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295650793835.340, "dur": 24.855, "args": { "External id": 19067,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1658 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295650793878.495, "dur": 25.483, "args": { "External id": 19068,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1659 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295650793919.198, "dur": 18.807, "args": { "External id": 19069,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1660 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295650793950.996, "dur": 15.074, "args": { "External id": 19070,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1661 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295650793980.947, "dur": 57.812, "args": { "External id": 19071,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794113.157, "dur": 15.853, "args": { "External id": 19072,"Record function id": 0, "Ev Idx": 1663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794117.042, "dur": 10.890, "args": { "External id": 19073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794121.160, "dur": 5.809, "args": { "External id": 19074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794123.121, "dur": 3.712, "args": { "External id": 19075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794132.983, "dur": 5.570, "args": { "External id": 19076,"Record function id": 0, "Ev Idx": 1667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794134.842, "dur": 3.163, "args": { "External id": 19077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794135.731, "dur": 1.779, "args": { "External id": 19078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794136.579, "dur": 0.845, "args": { "External id": 19079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794142.306, "dur": 5.393, "args": { "External id": 19080,"Record function id": 0, "Ev Idx": 1671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794144.282, "dur": 3.027, "args": { "External id": 19081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794145.039, "dur": 1.813, "args": { "External id": 19082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794145.648, "dur": 1.126, "args": { "External id": 19083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794151.102, "dur": 5.474, "args": { "External id": 19084,"Record function id": 0, "Ev Idx": 1675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794152.551, "dur": 3.524, "args": { "External id": 19085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794153.373, "dur": 2.225, "args": { "External id": 19086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794153.824, "dur": 1.685, "args": { "External id": 19087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794159.924, "dur": 4.166, "args": { "External id": 19088,"Record function id": 0, "Ev Idx": 1679 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794161.691, "dur": 2.009, "args": { "External id": 19089,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794162.164, "dur": 1.144, "args": { "External id": 19090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1681 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794162.541, "dur": 0.676, "args": { "External id": 19091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1682 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794167.543, "dur": 4.494, "args": { "External id": 19092,"Record function id": 0, "Ev Idx": 1683 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794169.377, "dur": 2.223, "args": { "External id": 19093,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794169.962, "dur": 1.202, "args": { "External id": 19094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1685 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794170.497, "dur": 0.577, "args": { "External id": 19095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1686 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794175.999, "dur": 4.241, "args": { "External id": 19096,"Record function id": 0, "Ev Idx": 1687 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794177.635, "dur": 2.191, "args": { "External id": 19097,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794178.168, "dur": 1.259, "args": { "External id": 19098,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1689 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794178.605, "dur": 0.726, "args": { "External id": 19099,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1690 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794183.673, "dur": 3.870, "args": { "External id": 19100,"Record function id": 0, "Ev Idx": 1691 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794185.143, "dur": 2.014, "args": { "External id": 19101,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794185.624, "dur": 1.145, "args": { "External id": 19102,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1693 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794185.886, "dur": 0.820, "args": { "External id": 19103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1694 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794190.946, "dur": 4.922, "args": { "External id": 19104,"Record function id": 0, "Ev Idx": 1695 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650794192.714, "dur": 2.757, "args": { "External id": 19105,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794193.643, "dur": 1.304, "args": { "External id": 19106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1697 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650794194.389, "dur": 0.468, "args": { "External id": 19107,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1698 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650794201.031, "dur": 173362.729, "args": { "External id": 19108,"Record function id": 0, "Sequence number": 246595, "Fwd thread id": 1, "Ev Idx": 1699 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650794202.415, "dur": 173352.809, "args": { "External id": 19109,"Sequence number": 246595, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1700 } }, { "ph": "f", "id": 173, "pid": 1336754, "tid": 1381179, "ts": 1295650794202.415, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.27)", "pid": 1336754, "tid": 1381179, "ts": 1295650794247.627, "dur": 41.525, "args": { "External id": 19110,"Record function id": 0, "Ev Idx": 1701 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.27)", "pid": 1336754, "tid": 1381179, "ts": 1295650794296.796, "dur": 71.324, "args": { "External id": 19111,"Record function id": 0, "Ev Idx": 1702 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.27)", "pid": 1336754, "tid": 1381179, "ts": 1295650794373.901, "dur": 173172.267, "args": { "External id": 19112,"Record function id": 0, "Ev Idx": 1703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650794429.035, "dur": 7.893, "args": { "External id": 19113,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650794446.715, "dur": 5.371, "args": { "External id": 19114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1705 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295650794467.810, "dur": 172155.854, "args": { "External id": 19115,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295650794482.411, "dur": 172129.162, "args": { "External id": 19116,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650794586.897, "dur": 5.975, "args": { "External id": 19117,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650794604.160, "dur": 171941.931, "args": { "External id": 19118,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650794606.799, "dur": 171938.194, "args": { "External id": 19119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650794613.960, "dur": 6.920, "args": { "External id": 19120,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650794622.734, "dur": 171916.656, "args": { "External id": 19121,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295650966737.937, "dur": 13.173, "args": { "External id": 19122,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650966742.091, "dur": 8.659, "args": { "External id": 19123,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295650966790.468, "dur": 398.239, "args": { "External id": 19124,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650966817.975, "dur": 365.270, "args": { "External id": 19125,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1716, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295650966830.363, "dur": 346.635, "args": { "External id": 19126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650967209.877, "dur": 2.478, "args": { "External id": 19127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1718, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967295.501, "dur": 10.580, "args": { "External id": 19128,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967364.562, "dur": 1.459, "args": { "External id": 19129,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967385.893, "dur": 0.961, "args": { "External id": 19130,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967401.798, "dur": 1.542, "args": { "External id": 19131,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967420.357, "dur": 1.322, "args": { "External id": 19132,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967434.041, "dur": 1.270, "args": { "External id": 19133,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967448.329, "dur": 1.155, "args": { "External id": 19134,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967463.628, "dur": 3.345, "args": { "External id": 19135,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967479.185, "dur": 1.047, "args": { "External id": 19136,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1727 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650967580.261, "dur": 2849.972, "args": { "External id": 19137,"Record function id": 0, "Ev Idx": 1728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650967599.271, "dur": 1072.397, "args": { "External id": 19138,"Record function id": 0, "Ev Idx": 1729 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650967615.121, "dur": 325.233, "args": { "External id": 19139,"Record function id": 0, "Ev Idx": 1730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967691.221, "dur": 4.076, "args": { "External id": 19140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967698.805, "dur": 1.333, "args": { "External id": 19141,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967702.124, "dur": 1.044, "args": { "External id": 19142,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967704.762, "dur": 1.788, "args": { "External id": 19143,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967708.170, "dur": 0.768, "args": { "External id": 19144,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967710.540, "dur": 0.989, "args": { "External id": 19145,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967713.660, "dur": 2.729, "args": { "External id": 19146,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967717.998, "dur": 1.136, "args": { "External id": 19147,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967720.678, "dur": 1.168, "args": { "External id": 19148,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650967723.335, "dur": 0.934, "args": { "External id": 19149,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1740 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650967742.563, "dur": 164.075, "args": { "External id": 19150,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650967759.415, "dur": 142.357, "args": { "External id": 19151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650967783.018, "dur": 12.965, "args": { "External id": 19152,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650967799.391, "dur": 71.262, "args": { "External id": 19153,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650967802.250, "dur": 68.032, "args": { "External id": 19154,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650967806.982, "dur": 7.822, "args": { "External id": 19155,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650967816.639, "dur": 52.928, "args": { "External id": 19156,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1747 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.25", "pid": 1336754, "tid": 1381179, "ts": 1295650968071.722, "dur": 591.324, "args": { "External id": 19157,"Record function id": 0, "Ev Idx": 1748 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295650968091.748, "dur": 558.083, "args": { "External id": 19158,"Record function id": 0, "Ev Idx": 1749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650968150.101, "dur": 6.369, "args": { "External id": 19159,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295650968173.652, "dur": 31.432, "args": { "External id": 19160,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968178.816, "dur": 1.749, "args": { "External id": 19161,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968183.471, "dur": 0.505, "args": { "External id": 19162,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968185.737, "dur": 0.459, "args": { "External id": 19163,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968188.070, "dur": 0.572, "args": { "External id": 19164,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968190.296, "dur": 0.334, "args": { "External id": 19165,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968192.542, "dur": 0.339, "args": { "External id": 19166,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968194.403, "dur": 1.312, "args": { "External id": 19167,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968197.427, "dur": 0.441, "args": { "External id": 19168,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968199.684, "dur": 0.362, "args": { "External id": 19169,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650968219.884, "dur": 51.391, "args": { "External id": 19170,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1761 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295650968308.698, "dur": 111.284, "args": { "External id": 19171,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650968320.668, "dur": 4.057, "args": { "External id": 19172,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295650968330.223, "dur": 10.470, "args": { "External id": 19173,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295650968334.360, "dur": 5.940, "args": { "External id": 19174,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968338.183, "dur": 0.571, "args": { "External id": 19175,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295650968349.333, "dur": 24.765, "args": { "External id": 19176,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968351.846, "dur": 0.370, "args": { "External id": 19177,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968354.265, "dur": 0.411, "args": { "External id": 19178,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968356.361, "dur": 0.498, "args": { "External id": 19179,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968358.750, "dur": 1.248, "args": { "External id": 19180,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968361.882, "dur": 0.477, "args": { "External id": 19181,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968363.818, "dur": 0.278, "args": { "External id": 19182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968366.019, "dur": 0.373, "args": { "External id": 19183,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968368.253, "dur": 0.390, "args": { "External id": 19184,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650968370.014, "dur": 0.341, "args": { "External id": 19185,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650968387.457, "dur": 24.347, "args": { "External id": 19186,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1777 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295650968467.124, "dur": 115.996, "args": { "External id": 19187,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1778 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650968490.278, "dur": 89.270, "args": { "External id": 19188,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1779, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295650968503.423, "dur": 72.142, "args": { "External id": 19189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1780 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295650968597.999, "dur": 1.731, "args": { "External id": 19190,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1781, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650968678.727, "dur": 1730.757, "args": { "External id": 19191,"Sequence number": 246594, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1782 } }, { "ph": "f", "id": 174, "pid": 1336754, "tid": 1381179, "ts": 1295650968678.727, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650968784.441, "dur": 106.348, "args": { "External id": 19192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1783 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295650968932.927, "dur": 44.201, "args": { "External id": 19193,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295650969039.754, "dur": 64.762, "args": { "External id": 19194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969114.619, "dur": 41.245, "args": { "External id": 19195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969164.376, "dur": 48.353, "args": { "External id": 19196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969220.480, "dur": 47.409, "args": { "External id": 19197,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969278.922, "dur": 46.560, "args": { "External id": 19198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295650969351.574, "dur": 24.441, "args": { "External id": 19199,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1790 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295650969397.669, "dur": 28.982, "args": { "External id": 19200,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1791 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295650969447.661, "dur": 22.464, "args": { "External id": 19201,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1792 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295650969484.622, "dur": 16.673, "args": { "External id": 19202,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969509.974, "dur": 31.369, "args": { "External id": 19203,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969544.932, "dur": 34.054, "args": { "External id": 19204,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1795 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295650969608.645, "dur": 166.549, "args": { "External id": 19205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650969687.328, "dur": 5.731, "args": { "External id": 19206,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650969694.997, "dur": 2.078, "args": { "External id": 19207,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1798 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295650969815.148, "dur": 26.018, "args": { "External id": 19208,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1799 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295650969854.496, "dur": 15.940, "args": { "External id": 19209,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969879.196, "dur": 36.765, "args": { "External id": 19210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969922.707, "dur": 35.758, "args": { "External id": 19211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650969968.223, "dur": 58.980, "args": { "External id": 19212,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650970036.145, "dur": 56.807, "args": { "External id": 19213,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650970106.594, "dur": 24.360, "args": { "External id": 19214,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295650970138.924, "dur": 30.273, "args": { "External id": 19215,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1806 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295650970190.187, "dur": 28.169, "args": { "External id": 19216,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1807 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295650970250.592, "dur": 29.955, "args": { "External id": 19217,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1808 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295650970296.639, "dur": 18.701, "args": { "External id": 19218,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1809 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295650970330.523, "dur": 16.234, "args": { "External id": 19219,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1810 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295650970362.368, "dur": 17.173, "args": { "External id": 19220,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970453.275, "dur": 14.978, "args": { "External id": 19221,"Record function id": 0, "Ev Idx": 1812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970456.296, "dur": 10.813, "args": { "External id": 19222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970460.474, "dur": 5.649, "args": { "External id": 19223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970462.231, "dur": 3.758, "args": { "External id": 19224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970472.090, "dur": 4.578, "args": { "External id": 19225,"Record function id": 0, "Ev Idx": 1816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970473.373, "dur": 2.878, "args": { "External id": 19226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970474.079, "dur": 1.681, "args": { "External id": 19227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970474.784, "dur": 0.867, "args": { "External id": 19228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970479.851, "dur": 4.009, "args": { "External id": 19229,"Record function id": 0, "Ev Idx": 1820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970480.986, "dur": 2.483, "args": { "External id": 19230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970481.491, "dur": 1.488, "args": { "External id": 19231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970481.897, "dur": 1.016, "args": { "External id": 19232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970487.050, "dur": 5.288, "args": { "External id": 19233,"Record function id": 0, "Ev Idx": 1824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970488.276, "dur": 3.643, "args": { "External id": 19234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970489.200, "dur": 2.262, "args": { "External id": 19235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970489.806, "dur": 1.572, "args": { "External id": 19236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970495.518, "dur": 3.911, "args": { "External id": 19237,"Record function id": 0, "Ev Idx": 1828 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970497.005, "dur": 2.030, "args": { "External id": 19238,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970497.662, "dur": 0.928, "args": { "External id": 19239,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1830 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970497.951, "dur": 0.558, "args": { "External id": 19240,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1831 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970502.703, "dur": 3.459, "args": { "External id": 19241,"Record function id": 0, "Ev Idx": 1832 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970503.819, "dur": 1.950, "args": { "External id": 19242,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970504.302, "dur": 1.013, "args": { "External id": 19243,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1834 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970504.726, "dur": 0.492, "args": { "External id": 19244,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1835 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970509.407, "dur": 3.371, "args": { "External id": 19245,"Record function id": 0, "Ev Idx": 1836 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970510.557, "dur": 1.805, "args": { "External id": 19246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970511.070, "dur": 0.856, "args": { "External id": 19247,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1838 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970511.346, "dur": 0.480, "args": { "External id": 19248,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1839 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970515.897, "dur": 3.965, "args": { "External id": 19249,"Record function id": 0, "Ev Idx": 1840 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970516.970, "dur": 2.477, "args": { "External id": 19250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970517.567, "dur": 1.453, "args": { "External id": 19251,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1842 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970518.190, "dur": 0.765, "args": { "External id": 19252,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1843 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970522.900, "dur": 4.022, "args": { "External id": 19253,"Record function id": 0, "Ev Idx": 1844 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295650970524.162, "dur": 2.368, "args": { "External id": 19254,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970524.861, "dur": 1.241, "args": { "External id": 19255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1846 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295650970525.491, "dur": 0.526, "args": { "External id": 19256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1847 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650970530.717, "dur": 36829.746, "args": { "External id": 19257,"Record function id": 0, "Sequence number": 246593, "Fwd thread id": 1, "Ev Idx": 1848 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295650970532.015, "dur": 36819.398, "args": { "External id": 19258,"Sequence number": 246593, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1849 } }, { "ph": "f", "id": 175, "pid": 1336754, "tid": 1381179, "ts": 1295650970532.015, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650970560.779, "dur": 38.973, "args": { "External id": 19259,"Record function id": 0, "Ev Idx": 1850 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650970607.904, "dur": 62.808, "args": { "External id": 19260,"Record function id": 0, "Ev Idx": 1851 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.26)", "pid": 1336754, "tid": 1381179, "ts": 1295650970676.464, "dur": 36666.162, "args": { "External id": 19261,"Record function id": 0, "Ev Idx": 1852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650970769.882, "dur": 6.343, "args": { "External id": 19262,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295650970785.658, "dur": 4.470, "args": { "External id": 19263,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1854 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295650970804.897, "dur": 35657.607, "args": { "External id": 19264,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295650970818.334, "dur": 35635.403, "args": { "External id": 19265,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 1856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295650970874.970, "dur": 15.046, "args": { "External id": 19266,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295650970897.692, "dur": 35516.306, "args": { "External id": 19267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 1858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295650970900.548, "dur": 35512.752, "args": { "External id": 19268,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 1859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295650970905.012, "dur": 4.734, "args": { "External id": 19269,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295650970911.640, "dur": 35497.859, "args": { "External id": 19270,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 1861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651006552.200, "dur": 9.263, "args": { "External id": 19271,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 1862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651006555.433, "dur": 5.687, "args": { "External id": 19272,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651006592.182, "dur": 383.864, "args": { "External id": 19273,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 1864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651006618.807, "dur": 352.203, "args": { "External id": 19274,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1865, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651006629.924, "dur": 335.698, "args": { "External id": 19275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 1866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651007028.671, "dur": 3.489, "args": { "External id": 19276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1867, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007096.456, "dur": 6.805, "args": { "External id": 19277,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007151.695, "dur": 1.609, "args": { "External id": 19278,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007172.803, "dur": 0.924, "args": { "External id": 19279,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007187.786, "dur": 0.825, "args": { "External id": 19280,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007202.129, "dur": 0.961, "args": { "External id": 19281,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007215.671, "dur": 1.025, "args": { "External id": 19282,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007245.407, "dur": 1.864, "args": { "External id": 19283,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007264.920, "dur": 2.287, "args": { "External id": 19284,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007278.731, "dur": 1.187, "args": { "External id": 19285,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1876 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651007376.412, "dur": 2808.063, "args": { "External id": 19286,"Record function id": 0, "Ev Idx": 1877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295651007395.728, "dur": 1066.707, "args": { "External id": 19287,"Record function id": 0, "Ev Idx": 1878 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295651007412.423, "dur": 331.285, "args": { "External id": 19288,"Record function id": 0, "Ev Idx": 1879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007487.645, "dur": 3.993, "args": { "External id": 19289,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 1880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007495.380, "dur": 1.122, "args": { "External id": 19290,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007498.375, "dur": 1.158, "args": { "External id": 19291,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007501.128, "dur": 2.103, "args": { "External id": 19292,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007504.807, "dur": 0.868, "args": { "External id": 19293,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007507.380, "dur": 1.072, "args": { "External id": 19294,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 1885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007510.040, "dur": 2.336, "args": { "External id": 19295,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 1886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007513.744, "dur": 0.982, "args": { "External id": 19296,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007515.934, "dur": 0.878, "args": { "External id": 19297,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651007518.212, "dur": 0.892, "args": { "External id": 19298,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 1889 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651007540.176, "dur": 172.233, "args": { "External id": 19299,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651007556.295, "dur": 151.692, "args": { "External id": 19300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 1891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651007582.176, "dur": 13.124, "args": { "External id": 19301,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651007598.131, "dur": 76.894, "args": { "External id": 19302,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 1893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651007601.005, "dur": 73.721, "args": { "External id": 19303,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 1894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007605.264, "dur": 8.468, "args": { "External id": 19304,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651007615.655, "dur": 58.462, "args": { "External id": 19305,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 1896 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.24", "pid": 1336754, "tid": 1381179, "ts": 1295651007820.749, "dur": 633.478, "args": { "External id": 19306,"Record function id": 0, "Ev Idx": 1897 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651007836.417, "dur": 604.023, "args": { "External id": 19307,"Record function id": 0, "Ev Idx": 1898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651007890.706, "dur": 4.364, "args": { "External id": 19308,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651007911.104, "dur": 31.077, "args": { "External id": 19309,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007916.226, "dur": 1.310, "args": { "External id": 19310,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007919.695, "dur": 0.346, "args": { "External id": 19311,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007921.815, "dur": 0.532, "args": { "External id": 19312,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007923.985, "dur": 0.373, "args": { "External id": 19313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007926.236, "dur": 0.378, "args": { "External id": 19314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007929.093, "dur": 0.300, "args": { "External id": 19315,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007930.933, "dur": 1.607, "args": { "External id": 19316,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007934.304, "dur": 0.528, "args": { "External id": 19317,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651007936.896, "dur": 0.573, "args": { "External id": 19318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651007951.541, "dur": 67.772, "args": { "External id": 19319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1910 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651008054.885, "dur": 123.582, "args": { "External id": 19320,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 1911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651008065.618, "dur": 5.014, "args": { "External id": 19321,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651008075.770, "dur": 11.071, "args": { "External id": 19322,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651008079.772, "dur": 6.658, "args": { "External id": 19323,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 1914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008083.885, "dur": 0.982, "args": { "External id": 19324,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 1915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651008094.589, "dur": 40.279, "args": { "External id": 19325,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 1916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008097.476, "dur": 0.706, "args": { "External id": 19326,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008100.387, "dur": 0.399, "args": { "External id": 19327,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008114.944, "dur": 0.620, "args": { "External id": 19328,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008117.534, "dur": 1.772, "args": { "External id": 19329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008120.821, "dur": 0.607, "args": { "External id": 19330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008123.365, "dur": 0.413, "args": { "External id": 19331,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008125.429, "dur": 0.380, "args": { "External id": 19332,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008127.803, "dur": 0.339, "args": { "External id": 19333,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651008129.616, "dur": 0.424, "args": { "External id": 19334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 1925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651008146.100, "dur": 24.691, "args": { "External id": 19335,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 1926 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651008244.919, "dur": 123.445, "args": { "External id": 19336,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 1927 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651008271.665, "dur": 92.953, "args": { "External id": 19337,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 1928, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651008282.452, "dur": 75.501, "args": { "External id": 19338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 1929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651008384.502, "dur": 1.968, "args": { "External id": 19339,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 1930, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651008469.285, "dur": 1694.912, "args": { "External id": 19340,"Sequence number": 246592, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1931 } }, { "ph": "f", "id": 176, "pid": 1336754, "tid": 1381179, "ts": 1295651008469.285, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651008576.846, "dur": 103.695, "args": { "External id": 19341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 1932 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651008717.950, "dur": 39.441, "args": { "External id": 19342,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 1933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651008774.508, "dur": 50.428, "args": { "External id": 19343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 1934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651008835.094, "dur": 34.289, "args": { "External id": 19344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651008877.357, "dur": 45.322, "args": { "External id": 19345,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651008929.998, "dur": 28.708, "args": { "External id": 19346,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 1937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651008973.929, "dur": 85.725, "args": { "External id": 19347,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 1938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651009090.194, "dur": 24.903, "args": { "External id": 19348,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 1939 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651009134.722, "dur": 30.844, "args": { "External id": 19349,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1940 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651009187.910, "dur": 22.139, "args": { "External id": 19350,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1941 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651009226.701, "dur": 35.537, "args": { "External id": 19351,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009274.581, "dur": 36.470, "args": { "External id": 19352,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009314.571, "dur": 34.959, "args": { "External id": 19353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1944 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651009376.942, "dur": 174.234, "args": { "External id": 19354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 1945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651009459.236, "dur": 6.852, "args": { "External id": 19355,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651009468.371, "dur": 2.638, "args": { "External id": 19356,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 1947 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651009580.317, "dur": 26.099, "args": { "External id": 19357,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1948 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651009617.800, "dur": 15.317, "args": { "External id": 19358,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009640.861, "dur": 35.858, "args": { "External id": 19359,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009683.462, "dur": 35.949, "args": { "External id": 19360,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009727.222, "dur": 23.732, "args": { "External id": 19361,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009769.589, "dur": 41.975, "args": { "External id": 19362,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009820.499, "dur": 25.080, "args": { "External id": 19363,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 1954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651009853.309, "dur": 31.059, "args": { "External id": 19364,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 1955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651009906.378, "dur": 24.609, "args": { "External id": 19365,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 1956 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651009948.195, "dur": 27.462, "args": { "External id": 19366,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 1957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651010030.499, "dur": 27.464, "args": { "External id": 19367,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 1958 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651010077.112, "dur": 26.533, "args": { "External id": 19368,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 1959 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651010118.267, "dur": 16.860, "args": { "External id": 19369,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 1960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010207.540, "dur": 15.161, "args": { "External id": 19370,"Record function id": 0, "Ev Idx": 1961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010210.713, "dur": 11.068, "args": { "External id": 19371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010214.911, "dur": 5.981, "args": { "External id": 19372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010216.848, "dur": 3.881, "args": { "External id": 19373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010227.079, "dur": 22.370, "args": { "External id": 19374,"Record function id": 0, "Ev Idx": 1965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010242.533, "dur": 5.861, "args": { "External id": 19375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010244.071, "dur": 3.433, "args": { "External id": 19376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010245.332, "dur": 1.888, "args": { "External id": 19377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010254.356, "dur": 5.002, "args": { "External id": 19378,"Record function id": 0, "Ev Idx": 1969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010255.870, "dur": 3.077, "args": { "External id": 19379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010256.470, "dur": 2.033, "args": { "External id": 19380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010257.375, "dur": 1.061, "args": { "External id": 19381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 1972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010262.533, "dur": 4.477, "args": { "External id": 19382,"Record function id": 0, "Ev Idx": 1973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010263.554, "dur": 3.043, "args": { "External id": 19383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010264.111, "dur": 2.026, "args": { "External id": 19384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010264.451, "dur": 1.620, "args": { "External id": 19385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 1976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010270.117, "dur": 3.867, "args": { "External id": 19386,"Record function id": 0, "Ev Idx": 1977 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010271.517, "dur": 2.060, "args": { "External id": 19387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010271.990, "dur": 1.134, "args": { "External id": 19388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1979 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010272.373, "dur": 0.673, "args": { "External id": 19389,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1980 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010277.114, "dur": 4.436, "args": { "External id": 19390,"Record function id": 0, "Ev Idx": 1981 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010278.582, "dur": 2.555, "args": { "External id": 19391,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010279.258, "dur": 1.465, "args": { "External id": 19392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1983 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010279.896, "dur": 0.729, "args": { "External id": 19393,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1984 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010285.107, "dur": 4.490, "args": { "External id": 19394,"Record function id": 0, "Ev Idx": 1985 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010286.316, "dur": 2.887, "args": { "External id": 19395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010287.466, "dur": 1.321, "args": { "External id": 19396,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1987 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010288.223, "dur": 0.466, "args": { "External id": 19397,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1988 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010292.906, "dur": 3.903, "args": { "External id": 19398,"Record function id": 0, "Ev Idx": 1989 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010294.490, "dur": 1.918, "args": { "External id": 19399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010294.959, "dur": 1.034, "args": { "External id": 19400,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1991 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010295.269, "dur": 0.657, "args": { "External id": 19401,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 1992 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010299.854, "dur": 3.810, "args": { "External id": 19402,"Record function id": 0, "Ev Idx": 1993 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651010300.955, "dur": 2.307, "args": { "External id": 19403,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010301.417, "dur": 1.427, "args": { "External id": 19404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1995 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651010302.121, "dur": 0.621, "args": { "External id": 19405,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 1996 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651010307.458, "dur": 36184.287, "args": { "External id": 19406,"Record function id": 0, "Sequence number": 246591, "Fwd thread id": 1, "Ev Idx": 1997 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651010308.970, "dur": 36169.532, "args": { "External id": 19407,"Sequence number": 246591, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 1998 } }, { "ph": "f", "id": 177, "pid": 1336754, "tid": 1381179, "ts": 1295651010308.970, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295651010340.688, "dur": 36.676, "args": { "External id": 19408,"Record function id": 0, "Ev Idx": 1999 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295651010385.372, "dur": 60.215, "args": { "External id": 19409,"Record function id": 0, "Ev Idx": 2000 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.25)", "pid": 1336754, "tid": 1381179, "ts": 1295651010451.376, "dur": 36019.225, "args": { "External id": 19410,"Record function id": 0, "Ev Idx": 2001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651010538.229, "dur": 6.761, "args": { "External id": 19411,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651010554.684, "dur": 4.551, "args": { "External id": 19412,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2003 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651010574.464, "dur": 35053.493, "args": { "External id": 19413,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651010587.686, "dur": 35030.141, "args": { "External id": 19414,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651010638.882, "dur": 15.745, "args": { "External id": 19415,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651010661.667, "dur": 34914.581, "args": { "External id": 19416,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651010664.350, "dur": 34911.022, "args": { "External id": 19417,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651010669.089, "dur": 4.617, "args": { "External id": 19418,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651010675.970, "dur": 34895.004, "args": { "External id": 19419,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651045726.106, "dur": 10.553, "args": { "External id": 19420,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651045729.989, "dur": 6.303, "args": { "External id": 19421,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651045768.747, "dur": 376.777, "args": { "External id": 19422,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651045796.194, "dur": 343.993, "args": { "External id": 19423,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2014, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651045808.295, "dur": 325.781, "args": { "External id": 19424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651046166.555, "dur": 2.129, "args": { "External id": 19425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2016, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046245.795, "dur": 6.939, "args": { "External id": 19426,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046301.222, "dur": 1.992, "args": { "External id": 19427,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046320.924, "dur": 1.291, "args": { "External id": 19428,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046336.536, "dur": 1.054, "args": { "External id": 19429,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046351.498, "dur": 1.125, "args": { "External id": 19430,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046363.938, "dur": 0.936, "args": { "External id": 19431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046377.319, "dur": 1.181, "args": { "External id": 19432,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046391.909, "dur": 2.238, "args": { "External id": 19433,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046406.452, "dur": 1.462, "args": { "External id": 19434,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2025 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651046507.467, "dur": 2821.984, "args": { "External id": 19435,"Record function id": 0, "Ev Idx": 2026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651046526.423, "dur": 1073.078, "args": { "External id": 19436,"Record function id": 0, "Ev Idx": 2027 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651046542.928, "dur": 323.938, "args": { "External id": 19437,"Record function id": 0, "Ev Idx": 2028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046618.841, "dur": 3.661, "args": { "External id": 19438,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046626.011, "dur": 1.058, "args": { "External id": 19439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046629.099, "dur": 0.850, "args": { "External id": 19440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046631.691, "dur": 2.077, "args": { "External id": 19441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046635.608, "dur": 1.332, "args": { "External id": 19442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046638.841, "dur": 1.074, "args": { "External id": 19443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046641.588, "dur": 2.270, "args": { "External id": 19444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046645.482, "dur": 1.161, "args": { "External id": 19445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046648.373, "dur": 1.056, "args": { "External id": 19446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651046650.742, "dur": 0.885, "args": { "External id": 19447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2038 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651046669.321, "dur": 161.542, "args": { "External id": 19448,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651046686.234, "dur": 140.341, "args": { "External id": 19449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651046706.918, "dur": 12.603, "args": { "External id": 19450,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651046722.771, "dur": 74.528, "args": { "External id": 19451,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651046725.713, "dur": 71.193, "args": { "External id": 19452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651046729.800, "dur": 8.742, "args": { "External id": 19453,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651046740.387, "dur": 55.801, "args": { "External id": 19454,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2045 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.23", "pid": 1336754, "tid": 1381179, "ts": 1295651046945.989, "dur": 644.792, "args": { "External id": 19455,"Record function id": 0, "Ev Idx": 2046 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651046963.171, "dur": 613.548, "args": { "External id": 19456,"Record function id": 0, "Ev Idx": 2047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651047083.527, "dur": 7.689, "args": { "External id": 19457,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651047108.878, "dur": 32.404, "args": { "External id": 19458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047114.468, "dur": 1.722, "args": { "External id": 19459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047118.761, "dur": 0.420, "args": { "External id": 19460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047121.237, "dur": 0.435, "args": { "External id": 19461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047123.454, "dur": 0.365, "args": { "External id": 19462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047125.635, "dur": 0.585, "args": { "External id": 19463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047128.365, "dur": 0.386, "args": { "External id": 19464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047130.357, "dur": 1.448, "args": { "External id": 19465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047133.627, "dur": 0.381, "args": { "External id": 19466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047135.719, "dur": 0.382, "args": { "External id": 19467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651047152.243, "dur": 37.750, "args": { "External id": 19468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2059 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651047222.580, "dur": 126.831, "args": { "External id": 19469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651047250.054, "dur": 4.835, "args": { "External id": 19470,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651047260.890, "dur": 10.415, "args": { "External id": 19471,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651047265.022, "dur": 5.881, "args": { "External id": 19472,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047268.796, "dur": 0.640, "args": { "External id": 19473,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651047278.784, "dur": 26.611, "args": { "External id": 19474,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047281.541, "dur": 0.359, "args": { "External id": 19475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047283.677, "dur": 0.364, "args": { "External id": 19476,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047285.993, "dur": 0.473, "args": { "External id": 19477,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047288.104, "dur": 1.345, "args": { "External id": 19478,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047291.503, "dur": 0.335, "args": { "External id": 19479,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047293.604, "dur": 0.471, "args": { "External id": 19480,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047295.671, "dur": 0.325, "args": { "External id": 19481,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047297.991, "dur": 0.813, "args": { "External id": 19482,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651047300.553, "dur": 0.338, "args": { "External id": 19483,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651047318.176, "dur": 23.517, "args": { "External id": 19484,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2075 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651047398.957, "dur": 113.665, "args": { "External id": 19485,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2076 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651047421.739, "dur": 87.365, "args": { "External id": 19486,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2077, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651047431.419, "dur": 72.830, "args": { "External id": 19487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2078 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651047525.927, "dur": 1.797, "args": { "External id": 19488,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2079, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651047606.185, "dur": 1702.492, "args": { "External id": 19489,"Sequence number": 246590, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2080 } }, { "ph": "f", "id": 178, "pid": 1336754, "tid": 1381179, "ts": 1295651047606.185, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651047711.606, "dur": 102.188, "args": { "External id": 19490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2081 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651047852.444, "dur": 42.077, "args": { "External id": 19491,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651047911.231, "dur": 53.631, "args": { "External id": 19492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651047974.138, "dur": 80.128, "args": { "External id": 19493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048066.598, "dur": 48.967, "args": { "External id": 19494,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048123.894, "dur": 32.957, "args": { "External id": 19495,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048164.231, "dur": 43.680, "args": { "External id": 19496,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651048246.924, "dur": 26.769, "args": { "External id": 19497,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2088 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651048297.194, "dur": 27.919, "args": { "External id": 19498,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2089 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651048345.089, "dur": 20.836, "args": { "External id": 19499,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2090 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651048378.850, "dur": 16.292, "args": { "External id": 19500,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048403.921, "dur": 37.697, "args": { "External id": 19501,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048445.347, "dur": 37.471, "args": { "External id": 19502,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2093 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651048522.058, "dur": 172.711, "args": { "External id": 19503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651048601.131, "dur": 6.165, "args": { "External id": 19504,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651048609.590, "dur": 2.177, "args": { "External id": 19505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2096 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651048723.645, "dur": 26.322, "args": { "External id": 19506,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2097 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651048760.918, "dur": 15.248, "args": { "External id": 19507,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048784.652, "dur": 36.065, "args": { "External id": 19508,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048827.842, "dur": 34.995, "args": { "External id": 19509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048872.446, "dur": 23.084, "args": { "External id": 19510,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048900.836, "dur": 43.999, "args": { "External id": 19511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651048957.388, "dur": 63.352, "args": { "External id": 19512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651049032.068, "dur": 40.850, "args": { "External id": 19513,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2104 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651049092.698, "dur": 25.740, "args": { "External id": 19514,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2105 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651049138.311, "dur": 25.056, "args": { "External id": 19515,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2106 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651049177.674, "dur": 19.739, "args": { "External id": 19516,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2107 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651049211.773, "dur": 32.181, "args": { "External id": 19517,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2108 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651049261.006, "dur": 19.097, "args": { "External id": 19518,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049351.009, "dur": 15.516, "args": { "External id": 19519,"Record function id": 0, "Ev Idx": 2110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049354.158, "dur": 11.298, "args": { "External id": 19520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049358.688, "dur": 5.840, "args": { "External id": 19521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049360.425, "dur": 3.977, "args": { "External id": 19522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049370.856, "dur": 4.891, "args": { "External id": 19523,"Record function id": 0, "Ev Idx": 2114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049372.118, "dur": 3.198, "args": { "External id": 19524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049373.069, "dur": 1.789, "args": { "External id": 19525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049373.871, "dur": 0.865, "args": { "External id": 19526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049378.975, "dur": 4.793, "args": { "External id": 19527,"Record function id": 0, "Ev Idx": 2118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049380.189, "dur": 3.183, "args": { "External id": 19528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049380.909, "dur": 2.015, "args": { "External id": 19529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049381.389, "dur": 1.469, "args": { "External id": 19530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049387.080, "dur": 5.029, "args": { "External id": 19531,"Record function id": 0, "Ev Idx": 2122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049388.380, "dur": 3.298, "args": { "External id": 19532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049389.186, "dur": 2.091, "args": { "External id": 19533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049389.538, "dur": 1.664, "args": { "External id": 19534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049395.270, "dur": 3.752, "args": { "External id": 19535,"Record function id": 0, "Ev Idx": 2126 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049396.458, "dur": 2.139, "args": { "External id": 19536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049396.992, "dur": 1.214, "args": { "External id": 19537,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2128 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049397.505, "dur": 0.634, "args": { "External id": 19538,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2129 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049402.095, "dur": 3.623, "args": { "External id": 19539,"Record function id": 0, "Ev Idx": 2130 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049403.293, "dur": 2.039, "args": { "External id": 19540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049403.782, "dur": 1.131, "args": { "External id": 19541,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2132 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049404.193, "dur": 0.623, "args": { "External id": 19542,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2133 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049408.992, "dur": 3.674, "args": { "External id": 19543,"Record function id": 0, "Ev Idx": 2134 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049410.082, "dur": 2.176, "args": { "External id": 19544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049410.603, "dur": 1.236, "args": { "External id": 19545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2136 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049410.881, "dur": 0.859, "args": { "External id": 19546,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2137 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049415.732, "dur": 3.799, "args": { "External id": 19547,"Record function id": 0, "Ev Idx": 2138 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049417.140, "dur": 2.003, "args": { "External id": 19548,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049417.731, "dur": 0.998, "args": { "External id": 19549,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2140 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049417.977, "dur": 0.690, "args": { "External id": 19550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2141 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049422.559, "dur": 3.457, "args": { "External id": 19551,"Record function id": 0, "Ev Idx": 2142 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651049423.640, "dur": 1.989, "args": { "External id": 19552,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049424.112, "dur": 1.101, "args": { "External id": 19553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2144 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651049424.669, "dur": 0.456, "args": { "External id": 19554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2145 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651049429.758, "dur": 36445.899, "args": { "External id": 19555,"Record function id": 0, "Sequence number": 246589, "Fwd thread id": 1, "Ev Idx": 2146 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651049430.897, "dur": 36436.614, "args": { "External id": 19556,"Sequence number": 246589, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2147 } }, { "ph": "f", "id": 179, "pid": 1336754, "tid": 1381179, "ts": 1295651049430.897, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651049459.116, "dur": 40.250, "args": { "External id": 19557,"Record function id": 0, "Ev Idx": 2148 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651049506.976, "dur": 63.119, "args": { "External id": 19558,"Record function id": 0, "Ev Idx": 2149 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.24)", "pid": 1336754, "tid": 1381179, "ts": 1295651049576.545, "dur": 36283.133, "args": { "External id": 19559,"Record function id": 0, "Ev Idx": 2150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651049661.818, "dur": 6.590, "args": { "External id": 19560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651049677.702, "dur": 4.629, "args": { "External id": 19561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2152 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651049700.434, "dur": 35276.693, "args": { "External id": 19562,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651049714.200, "dur": 35253.555, "args": { "External id": 19563,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651049767.538, "dur": 15.537, "args": { "External id": 19564,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651049789.635, "dur": 35135.338, "args": { "External id": 19565,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651049792.091, "dur": 35132.020, "args": { "External id": 19566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651049796.086, "dur": 4.912, "args": { "External id": 19567,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651049802.975, "dur": 35117.475, "args": { "External id": 19568,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651085097.548, "dur": 10.060, "args": { "External id": 19569,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651085101.221, "dur": 5.866, "args": { "External id": 19570,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651085139.412, "dur": 412.905, "args": { "External id": 19571,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651085169.239, "dur": 377.369, "args": { "External id": 19572,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2163, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651085180.701, "dur": 360.309, "args": { "External id": 19573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651085573.514, "dur": 2.187, "args": { "External id": 19574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2165, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085638.518, "dur": 6.571, "args": { "External id": 19575,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085692.584, "dur": 1.537, "args": { "External id": 19576,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085712.391, "dur": 1.056, "args": { "External id": 19577,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085727.435, "dur": 1.042, "args": { "External id": 19578,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085741.330, "dur": 0.834, "args": { "External id": 19579,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085754.632, "dur": 0.919, "args": { "External id": 19580,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085767.425, "dur": 0.942, "args": { "External id": 19581,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085783.025, "dur": 3.124, "args": { "External id": 19582,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651085797.694, "dur": 1.174, "args": { "External id": 19583,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2174 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651085889.425, "dur": 2747.399, "args": { "External id": 19584,"Record function id": 0, "Ev Idx": 2175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651085907.040, "dur": 999.200, "args": { "External id": 19585,"Record function id": 0, "Ev Idx": 2176 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651085921.411, "dur": 376.249, "args": { "External id": 19586,"Record function id": 0, "Ev Idx": 2177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086031.775, "dur": 4.943, "args": { "External id": 19587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086040.441, "dur": 1.027, "args": { "External id": 19588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086043.315, "dur": 1.082, "args": { "External id": 19589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086045.780, "dur": 2.545, "args": { "External id": 19590,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086050.156, "dur": 0.951, "args": { "External id": 19591,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086052.866, "dur": 0.678, "args": { "External id": 19592,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086055.282, "dur": 2.805, "args": { "External id": 19593,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086059.681, "dur": 1.053, "args": { "External id": 19594,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086062.641, "dur": 1.109, "args": { "External id": 19595,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651086065.217, "dur": 0.785, "args": { "External id": 19596,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2187 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651086085.002, "dur": 176.122, "args": { "External id": 19597,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651086102.211, "dur": 153.483, "args": { "External id": 19598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651086123.823, "dur": 13.226, "args": { "External id": 19599,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651086140.196, "dur": 69.649, "args": { "External id": 19600,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651086143.079, "dur": 66.323, "args": { "External id": 19601,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086147.281, "dur": 6.974, "args": { "External id": 19602,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651086156.094, "dur": 52.710, "args": { "External id": 19603,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2194 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.22", "pid": 1336754, "tid": 1381179, "ts": 1295651086376.403, "dur": 521.572, "args": { "External id": 19604,"Record function id": 0, "Ev Idx": 2195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651086394.069, "dur": 491.531, "args": { "External id": 19605,"Record function id": 0, "Ev Idx": 2196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651086448.229, "dur": 5.825, "args": { "External id": 19606,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651086470.111, "dur": 31.267, "args": { "External id": 19607,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086475.198, "dur": 1.396, "args": { "External id": 19608,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086479.156, "dur": 0.570, "args": { "External id": 19609,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086481.487, "dur": 0.515, "args": { "External id": 19610,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086484.132, "dur": 0.372, "args": { "External id": 19611,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086486.218, "dur": 0.376, "args": { "External id": 19612,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086488.256, "dur": 0.437, "args": { "External id": 19613,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086490.418, "dur": 1.511, "args": { "External id": 19614,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086493.521, "dur": 0.460, "args": { "External id": 19615,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086495.333, "dur": 0.318, "args": { "External id": 19616,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651086510.709, "dur": 31.351, "args": { "External id": 19617,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2208 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651086573.604, "dur": 101.161, "args": { "External id": 19618,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651086583.553, "dur": 3.300, "args": { "External id": 19619,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651086591.975, "dur": 9.950, "args": { "External id": 19620,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651086596.161, "dur": 5.382, "args": { "External id": 19621,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086599.880, "dur": 0.549, "args": { "External id": 19622,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651086609.515, "dur": 26.513, "args": { "External id": 19623,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086611.481, "dur": 0.661, "args": { "External id": 19624,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086614.495, "dur": 0.593, "args": { "External id": 19625,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086616.909, "dur": 0.519, "args": { "External id": 19626,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086619.029, "dur": 2.030, "args": { "External id": 19627,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086622.550, "dur": 0.367, "args": { "External id": 19628,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086624.753, "dur": 0.317, "args": { "External id": 19629,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086626.408, "dur": 0.374, "args": { "External id": 19630,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086628.362, "dur": 0.468, "args": { "External id": 19631,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651086630.266, "dur": 0.374, "args": { "External id": 19632,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651086646.933, "dur": 20.467, "args": { "External id": 19633,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2224 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651086719.963, "dur": 104.925, "args": { "External id": 19634,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2225 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651086739.967, "dur": 81.404, "args": { "External id": 19635,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2226, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651086749.063, "dur": 68.337, "args": { "External id": 19636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2227 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651086836.504, "dur": 1.951, "args": { "External id": 19637,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2228, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651086912.954, "dur": 1703.038, "args": { "External id": 19638,"Sequence number": 246588, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2229 } }, { "ph": "f", "id": 180, "pid": 1336754, "tid": 1381179, "ts": 1295651086912.954, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087057.967, "dur": 105.964, "args": { "External id": 19639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2230 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651087203.813, "dur": 56.098, "args": { "External id": 19640,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651087280.068, "dur": 56.344, "args": { "External id": 19641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087346.189, "dur": 35.562, "args": { "External id": 19642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087389.599, "dur": 46.130, "args": { "External id": 19643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087443.999, "dur": 29.110, "args": { "External id": 19644,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087481.167, "dur": 42.603, "args": { "External id": 19645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651087549.343, "dur": 23.131, "args": { "External id": 19646,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2237 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651087595.477, "dur": 28.496, "args": { "External id": 19647,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2238 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651087642.064, "dur": 20.646, "args": { "External id": 19648,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2239 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651087676.934, "dur": 16.533, "args": { "External id": 19649,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087702.036, "dur": 31.226, "args": { "External id": 19650,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651087736.646, "dur": 33.830, "args": { "External id": 19651,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2242 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651087796.865, "dur": 168.364, "args": { "External id": 19652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651087871.322, "dur": 6.230, "args": { "External id": 19653,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651087879.797, "dur": 1.971, "args": { "External id": 19654,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2245 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651088034.871, "dur": 31.103, "args": { "External id": 19655,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2246 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651088076.723, "dur": 14.328, "args": { "External id": 19656,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088101.143, "dur": 47.469, "args": { "External id": 19657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088155.392, "dur": 36.809, "args": { "External id": 19658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088219.747, "dur": 41.629, "args": { "External id": 19659,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088270.517, "dur": 34.849, "args": { "External id": 19660,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088313.482, "dur": 36.307, "args": { "External id": 19661,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651088362.782, "dur": 37.911, "args": { "External id": 19662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2253 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651088420.416, "dur": 26.151, "args": { "External id": 19663,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2254 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651088466.526, "dur": 24.741, "args": { "External id": 19664,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2255 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651088504.659, "dur": 20.697, "args": { "External id": 19665,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2256 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651088542.405, "dur": 17.251, "args": { "External id": 19666,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2257 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651088571.852, "dur": 16.122, "args": { "External id": 19667,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088658.465, "dur": 15.813, "args": { "External id": 19668,"Record function id": 0, "Ev Idx": 2259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088662.140, "dur": 11.049, "args": { "External id": 19669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088666.273, "dur": 6.053, "args": { "External id": 19670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088668.035, "dur": 4.163, "args": { "External id": 19671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088678.319, "dur": 4.933, "args": { "External id": 19672,"Record function id": 0, "Ev Idx": 2263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088679.746, "dur": 3.065, "args": { "External id": 19673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088680.558, "dur": 1.811, "args": { "External id": 19674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088681.389, "dur": 0.873, "args": { "External id": 19675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088686.637, "dur": 5.127, "args": { "External id": 19676,"Record function id": 0, "Ev Idx": 2267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088687.966, "dur": 3.392, "args": { "External id": 19677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088688.715, "dur": 2.226, "args": { "External id": 19678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088689.245, "dur": 1.633, "args": { "External id": 19679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088694.910, "dur": 3.848, "args": { "External id": 19680,"Record function id": 0, "Ev Idx": 2271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088696.050, "dur": 2.296, "args": { "External id": 19681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088696.517, "dur": 1.435, "args": { "External id": 19682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088697.013, "dur": 0.874, "args": { "External id": 19683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088701.848, "dur": 3.418, "args": { "External id": 19684,"Record function id": 0, "Ev Idx": 2275 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088702.979, "dur": 1.901, "args": { "External id": 19685,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088703.466, "dur": 0.996, "args": { "External id": 19686,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2277 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088703.792, "dur": 0.601, "args": { "External id": 19687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2278 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088708.342, "dur": 3.520, "args": { "External id": 19688,"Record function id": 0, "Ev Idx": 2279 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088709.371, "dur": 2.116, "args": { "External id": 19689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088709.846, "dur": 1.238, "args": { "External id": 19690,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2281 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088710.307, "dur": 0.679, "args": { "External id": 19691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2282 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088715.180, "dur": 3.235, "args": { "External id": 19692,"Record function id": 0, "Ev Idx": 2283 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088716.265, "dur": 1.759, "args": { "External id": 19693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088716.716, "dur": 0.859, "args": { "External id": 19694,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2285 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088717.009, "dur": 0.461, "args": { "External id": 19695,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2286 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088721.457, "dur": 3.446, "args": { "External id": 19696,"Record function id": 0, "Ev Idx": 2287 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088722.607, "dur": 1.926, "args": { "External id": 19697,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088723.103, "dur": 1.022, "args": { "External id": 19698,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2289 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088723.411, "dur": 0.647, "args": { "External id": 19699,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2290 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088727.868, "dur": 4.190, "args": { "External id": 19700,"Record function id": 0, "Ev Idx": 2291 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651088729.563, "dur": 2.103, "args": { "External id": 19701,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088730.015, "dur": 1.239, "args": { "External id": 19702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2293 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651088730.493, "dur": 0.659, "args": { "External id": 19703,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2294 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651088735.398, "dur": 35957.465, "args": { "External id": 19704,"Record function id": 0, "Sequence number": 246587, "Fwd thread id": 1, "Ev Idx": 2295 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651088736.586, "dur": 35947.699, "args": { "External id": 19705,"Sequence number": 246587, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2296 } }, { "ph": "f", "id": 181, "pid": 1336754, "tid": 1381179, "ts": 1295651088736.586, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651088767.164, "dur": 35.088, "args": { "External id": 19706,"Record function id": 0, "Ev Idx": 2297 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651088809.697, "dur": 57.923, "args": { "External id": 19707,"Record function id": 0, "Ev Idx": 2298 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.23)", "pid": 1336754, "tid": 1381179, "ts": 1295651088873.525, "dur": 35802.627, "args": { "External id": 19708,"Record function id": 0, "Ev Idx": 2299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651088959.223, "dur": 6.647, "args": { "External id": 19709,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651088975.147, "dur": 41.211, "args": { "External id": 19710,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2301 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651089034.866, "dur": 34893.499, "args": { "External id": 19711,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651089048.789, "dur": 34871.181, "args": { "External id": 19712,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651089091.987, "dur": 15.527, "args": { "External id": 19713,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651089113.916, "dur": 34763.444, "args": { "External id": 19714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651089116.813, "dur": 34759.950, "args": { "External id": 19715,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651089121.052, "dur": 5.264, "args": { "External id": 19716,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651089128.539, "dur": 34744.424, "args": { "External id": 19717,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651124041.987, "dur": 9.602, "args": { "External id": 19718,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651124045.323, "dur": 5.720, "args": { "External id": 19719,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651124081.389, "dur": 306.359, "args": { "External id": 19720,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651124108.294, "dur": 274.140, "args": { "External id": 19721,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2312, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651124120.067, "dur": 256.500, "args": { "External id": 19722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651124406.871, "dur": 2.235, "args": { "External id": 19723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2314, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124463.875, "dur": 6.416, "args": { "External id": 19724,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124515.307, "dur": 1.401, "args": { "External id": 19725,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124533.132, "dur": 2.298, "args": { "External id": 19726,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124546.925, "dur": 1.033, "args": { "External id": 19727,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124560.386, "dur": 1.082, "args": { "External id": 19728,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124572.338, "dur": 1.029, "args": { "External id": 19729,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124586.111, "dur": 2.144, "args": { "External id": 19730,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124601.058, "dur": 2.145, "args": { "External id": 19731,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124615.246, "dur": 0.931, "args": { "External id": 19732,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2323 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651124706.576, "dur": 2776.077, "args": { "External id": 19733,"Record function id": 0, "Ev Idx": 2324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651124725.583, "dur": 1030.820, "args": { "External id": 19734,"Record function id": 0, "Ev Idx": 2325 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651124740.874, "dur": 356.937, "args": { "External id": 19735,"Record function id": 0, "Ev Idx": 2326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124812.650, "dur": 3.917, "args": { "External id": 19736,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124819.802, "dur": 1.024, "args": { "External id": 19737,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124822.434, "dur": 2.045, "args": { "External id": 19738,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124826.064, "dur": 0.809, "args": { "External id": 19739,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124828.296, "dur": 0.840, "args": { "External id": 19740,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124830.789, "dur": 0.824, "args": { "External id": 19741,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124833.142, "dur": 2.027, "args": { "External id": 19742,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124837.117, "dur": 1.252, "args": { "External id": 19743,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124839.713, "dur": 0.709, "args": { "External id": 19744,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651124841.775, "dur": 1.088, "args": { "External id": 19745,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2336 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651124862.183, "dur": 197.740, "args": { "External id": 19746,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651124877.700, "dur": 177.077, "args": { "External id": 19747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651124898.087, "dur": 13.967, "args": { "External id": 19748,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651124915.364, "dur": 107.553, "args": { "External id": 19749,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651124918.131, "dur": 104.337, "args": { "External id": 19750,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651124922.086, "dur": 7.131, "args": { "External id": 19751,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651124931.381, "dur": 89.946, "args": { "External id": 19752,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2343 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.21", "pid": 1336754, "tid": 1381179, "ts": 1295651125183.423, "dur": 564.576, "args": { "External id": 19753,"Record function id": 0, "Ev Idx": 2344 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651125201.075, "dur": 534.512, "args": { "External id": 19754,"Record function id": 0, "Ev Idx": 2345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651125277.038, "dur": 6.839, "args": { "External id": 19755,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651125303.354, "dur": 29.693, "args": { "External id": 19756,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125308.454, "dur": 1.714, "args": { "External id": 19757,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125312.260, "dur": 0.509, "args": { "External id": 19758,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125314.601, "dur": 0.474, "args": { "External id": 19759,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125316.420, "dur": 0.370, "args": { "External id": 19760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125318.155, "dur": 0.494, "args": { "External id": 19761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125320.188, "dur": 1.450, "args": { "External id": 19762,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125323.414, "dur": 0.394, "args": { "External id": 19763,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125325.366, "dur": 0.344, "args": { "External id": 19764,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125327.390, "dur": 0.415, "args": { "External id": 19765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651125351.310, "dur": 35.837, "args": { "External id": 19766,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2357 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651125421.573, "dur": 100.937, "args": { "External id": 19767,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651125431.800, "dur": 3.168, "args": { "External id": 19768,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651125440.648, "dur": 9.840, "args": { "External id": 19769,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651125444.668, "dur": 5.423, "args": { "External id": 19770,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125448.277, "dur": 0.491, "args": { "External id": 19771,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651125457.007, "dur": 24.777, "args": { "External id": 19772,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125459.133, "dur": 0.359, "args": { "External id": 19773,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125461.147, "dur": 0.421, "args": { "External id": 19774,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125463.311, "dur": 1.613, "args": { "External id": 19775,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125466.286, "dur": 0.655, "args": { "External id": 19776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125468.973, "dur": 0.430, "args": { "External id": 19777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125470.840, "dur": 0.353, "args": { "External id": 19778,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125472.873, "dur": 0.388, "args": { "External id": 19779,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125474.733, "dur": 0.330, "args": { "External id": 19780,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651125476.906, "dur": 0.403, "args": { "External id": 19781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651125493.401, "dur": 21.509, "args": { "External id": 19782,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2373 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651125566.775, "dur": 106.425, "args": { "External id": 19783,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2374 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651125587.390, "dur": 82.554, "args": { "External id": 19784,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2375, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651125596.719, "dur": 68.741, "args": { "External id": 19785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2376 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651125686.715, "dur": 1.558, "args": { "External id": 19786,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2377, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651125763.192, "dur": 1699.693, "args": { "External id": 19787,"Sequence number": 246586, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2378 } }, { "ph": "f", "id": 182, "pid": 1336754, "tid": 1381179, "ts": 1295651125763.192, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651125866.811, "dur": 103.182, "args": { "External id": 19788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2379 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651126046.395, "dur": 40.887, "args": { "External id": 19789,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651126108.526, "dur": 59.586, "args": { "External id": 19790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126178.436, "dur": 36.711, "args": { "External id": 19791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126223.031, "dur": 64.939, "args": { "External id": 19792,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126299.738, "dur": 31.793, "args": { "External id": 19793,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126339.337, "dur": 42.338, "args": { "External id": 19794,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651126405.167, "dur": 24.378, "args": { "External id": 19795,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2386 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651126457.885, "dur": 29.206, "args": { "External id": 19796,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2387 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651126507.357, "dur": 20.723, "args": { "External id": 19797,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2388 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651126542.429, "dur": 16.880, "args": { "External id": 19798,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126569.436, "dur": 32.213, "args": { "External id": 19799,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126605.029, "dur": 35.077, "args": { "External id": 19800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2391 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651126668.699, "dur": 170.828, "args": { "External id": 19801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651126746.300, "dur": 5.879, "args": { "External id": 19802,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651126754.380, "dur": 2.492, "args": { "External id": 19803,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2394 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651126868.944, "dur": 25.415, "args": { "External id": 19804,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2395 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651126905.224, "dur": 14.934, "args": { "External id": 19805,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126928.385, "dur": 36.959, "args": { "External id": 19806,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651126973.056, "dur": 74.025, "args": { "External id": 19807,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651127059.616, "dur": 26.868, "args": { "External id": 19808,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651127092.430, "dur": 30.900, "args": { "External id": 19809,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651127130.188, "dur": 23.170, "args": { "External id": 19810,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651127173.329, "dur": 41.534, "args": { "External id": 19811,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651127251.190, "dur": 31.021, "args": { "External id": 19812,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2403 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651127301.216, "dur": 23.945, "args": { "External id": 19813,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651127342.226, "dur": 17.624, "args": { "External id": 19814,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2405 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651127374.893, "dur": 19.919, "args": { "External id": 19815,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2406 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651127414.523, "dur": 16.606, "args": { "External id": 19816,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127505.142, "dur": 15.522, "args": { "External id": 19817,"Record function id": 0, "Ev Idx": 2408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127508.551, "dur": 11.155, "args": { "External id": 19818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127512.821, "dur": 5.876, "args": { "External id": 19819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127514.388, "dur": 4.176, "args": { "External id": 19820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127524.870, "dur": 5.553, "args": { "External id": 19821,"Record function id": 0, "Ev Idx": 2412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127526.497, "dur": 3.499, "args": { "External id": 19822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127527.212, "dur": 2.338, "args": { "External id": 19823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127528.082, "dur": 1.359, "args": { "External id": 19824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127534.476, "dur": 4.407, "args": { "External id": 19825,"Record function id": 0, "Ev Idx": 2416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127535.850, "dur": 2.623, "args": { "External id": 19826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127536.409, "dur": 1.651, "args": { "External id": 19827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127536.886, "dur": 1.091, "args": { "External id": 19828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127541.986, "dur": 3.748, "args": { "External id": 19829,"Record function id": 0, "Ev Idx": 2420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127543.216, "dur": 2.117, "args": { "External id": 19830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127543.717, "dur": 1.221, "args": { "External id": 19831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127544.213, "dur": 0.663, "args": { "External id": 19832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127548.788, "dur": 3.619, "args": { "External id": 19833,"Record function id": 0, "Ev Idx": 2424 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127550.042, "dur": 1.963, "args": { "External id": 19834,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127550.729, "dur": 0.882, "args": { "External id": 19835,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2426 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127551.049, "dur": 0.500, "args": { "External id": 19836,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2427 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127555.628, "dur": 3.712, "args": { "External id": 19837,"Record function id": 0, "Ev Idx": 2428 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127556.886, "dur": 2.051, "args": { "External id": 19838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127557.333, "dur": 1.182, "args": { "External id": 19839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2430 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127557.753, "dur": 0.661, "args": { "External id": 19840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2431 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127562.548, "dur": 3.993, "args": { "External id": 19841,"Record function id": 0, "Ev Idx": 2432 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127563.811, "dur": 2.333, "args": { "External id": 19842,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127564.466, "dur": 1.282, "args": { "External id": 19843,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2434 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127564.769, "dur": 0.887, "args": { "External id": 19844,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2435 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127569.636, "dur": 3.640, "args": { "External id": 19845,"Record function id": 0, "Ev Idx": 2436 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127570.742, "dur": 2.138, "args": { "External id": 19846,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127571.186, "dur": 1.284, "args": { "External id": 19847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2438 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127571.449, "dur": 0.959, "args": { "External id": 19848,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2439 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127576.455, "dur": 4.003, "args": { "External id": 19849,"Record function id": 0, "Ev Idx": 2440 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651127577.511, "dur": 2.515, "args": { "External id": 19850,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127577.939, "dur": 1.671, "args": { "External id": 19851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2442 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651127578.826, "dur": 0.702, "args": { "External id": 19852,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2443 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651127584.199, "dur": 35880.742, "args": { "External id": 19853,"Record function id": 0, "Sequence number": 246585, "Fwd thread id": 1, "Ev Idx": 2444 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651127585.693, "dur": 35870.682, "args": { "External id": 19854,"Sequence number": 246585, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2445 } }, { "ph": "f", "id": 183, "pid": 1336754, "tid": 1381179, "ts": 1295651127585.693, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651127615.068, "dur": 37.563, "args": { "External id": 19855,"Record function id": 0, "Ev Idx": 2446 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651127659.939, "dur": 59.399, "args": { "External id": 19856,"Record function id": 0, "Ev Idx": 2447 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.22)", "pid": 1336754, "tid": 1381179, "ts": 1295651127725.373, "dur": 35721.779, "args": { "External id": 19857,"Record function id": 0, "Ev Idx": 2448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651127813.588, "dur": 6.459, "args": { "External id": 19858,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651127828.979, "dur": 4.497, "args": { "External id": 19859,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2450 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651127847.614, "dur": 34742.510, "args": { "External id": 19860,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651127861.322, "dur": 34717.833, "args": { "External id": 19861,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651127905.273, "dur": 13.477, "args": { "External id": 19862,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651127925.443, "dur": 34610.203, "args": { "External id": 19863,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651127928.065, "dur": 34606.411, "args": { "External id": 19864,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651127931.737, "dur": 5.196, "args": { "External id": 19865,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651127938.733, "dur": 34591.006, "args": { "External id": 19866,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651162690.845, "dur": 10.857, "args": { "External id": 19867,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651162694.476, "dur": 6.853, "args": { "External id": 19868,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651162733.356, "dur": 401.063, "args": { "External id": 19869,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651162760.472, "dur": 368.779, "args": { "External id": 19870,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2461, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651162772.085, "dur": 351.432, "args": { "External id": 19871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651163155.637, "dur": 2.506, "args": { "External id": 19872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2463, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163220.337, "dur": 6.908, "args": { "External id": 19873,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163288.932, "dur": 2.597, "args": { "External id": 19874,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163308.823, "dur": 1.185, "args": { "External id": 19875,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163322.158, "dur": 1.114, "args": { "External id": 19876,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163335.248, "dur": 1.232, "args": { "External id": 19877,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163347.340, "dur": 1.224, "args": { "External id": 19878,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163359.264, "dur": 1.134, "args": { "External id": 19879,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163371.244, "dur": 2.320, "args": { "External id": 19880,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163383.589, "dur": 0.968, "args": { "External id": 19881,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2472 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651163481.089, "dur": 2780.102, "args": { "External id": 19882,"Record function id": 0, "Ev Idx": 2473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651163499.979, "dur": 1022.074, "args": { "External id": 19883,"Record function id": 0, "Ev Idx": 2474 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651163513.979, "dur": 322.399, "args": { "External id": 19884,"Record function id": 0, "Ev Idx": 2475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163588.100, "dur": 3.981, "args": { "External id": 19885,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163595.475, "dur": 1.479, "args": { "External id": 19886,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163599.137, "dur": 0.972, "args": { "External id": 19887,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163601.816, "dur": 1.042, "args": { "External id": 19888,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163604.466, "dur": 0.994, "args": { "External id": 19889,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163608.930, "dur": 1.086, "args": { "External id": 19890,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163611.618, "dur": 2.333, "args": { "External id": 19891,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163615.388, "dur": 1.242, "args": { "External id": 19892,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163618.125, "dur": 1.081, "args": { "External id": 19893,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651163622.628, "dur": 1.429, "args": { "External id": 19894,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2485 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651163640.992, "dur": 164.519, "args": { "External id": 19895,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651163669.069, "dur": 131.729, "args": { "External id": 19896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651163686.321, "dur": 14.059, "args": { "External id": 19897,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651163703.452, "dur": 69.676, "args": { "External id": 19898,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651163706.170, "dur": 66.569, "args": { "External id": 19899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651163709.349, "dur": 7.225, "args": { "External id": 19900,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651163718.113, "dur": 54.082, "args": { "External id": 19901,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2492 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.20", "pid": 1336754, "tid": 1381179, "ts": 1295651163913.647, "dur": 599.776, "args": { "External id": 19902,"Record function id": 0, "Ev Idx": 2493 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651163929.398, "dur": 570.943, "args": { "External id": 19903,"Record function id": 0, "Ev Idx": 2494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651163979.649, "dur": 44.378, "args": { "External id": 19904,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651164043.088, "dur": 31.418, "args": { "External id": 19905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164048.088, "dur": 1.714, "args": { "External id": 19906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164052.420, "dur": 0.606, "args": { "External id": 19907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164054.732, "dur": 0.554, "args": { "External id": 19908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164057.372, "dur": 0.380, "args": { "External id": 19909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164059.468, "dur": 0.457, "args": { "External id": 19910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164061.728, "dur": 0.909, "args": { "External id": 19911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164064.164, "dur": 0.942, "args": { "External id": 19912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164066.542, "dur": 0.771, "args": { "External id": 19913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164068.800, "dur": 0.637, "args": { "External id": 19914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651164083.737, "dur": 34.173, "args": { "External id": 19915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2506 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651164149.404, "dur": 125.312, "args": { "External id": 19916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651164160.104, "dur": 3.629, "args": { "External id": 19917,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651164168.085, "dur": 13.676, "args": { "External id": 19918,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651164175.759, "dur": 5.606, "args": { "External id": 19919,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164179.226, "dur": 0.808, "args": { "External id": 19920,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651164188.151, "dur": 25.695, "args": { "External id": 19921,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164190.360, "dur": 0.718, "args": { "External id": 19922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164192.631, "dur": 0.846, "args": { "External id": 19923,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164195.136, "dur": 0.675, "args": { "External id": 19924,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164197.021, "dur": 0.843, "args": { "External id": 19925,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164199.458, "dur": 0.683, "args": { "External id": 19926,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164201.711, "dur": 0.885, "args": { "External id": 19927,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164204.205, "dur": 0.667, "args": { "External id": 19928,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164206.259, "dur": 0.724, "args": { "External id": 19929,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651164208.494, "dur": 0.856, "args": { "External id": 19930,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651164223.351, "dur": 42.069, "args": { "External id": 19931,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2522 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651164322.350, "dur": 111.341, "args": { "External id": 19932,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2523 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651164344.448, "dur": 85.820, "args": { "External id": 19933,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2524, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651164354.393, "dur": 71.068, "args": { "External id": 19934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2525 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651164449.264, "dur": 1.826, "args": { "External id": 19935,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2526, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651164528.447, "dur": 1695.375, "args": { "External id": 19936,"Sequence number": 246584, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2527 } }, { "ph": "f", "id": 184, "pid": 1336754, "tid": 1381179, "ts": 1295651164528.447, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651164634.214, "dur": 106.540, "args": { "External id": 19937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2528 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651164781.285, "dur": 37.137, "args": { "External id": 19938,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651164834.024, "dur": 48.762, "args": { "External id": 19939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651164891.838, "dur": 32.604, "args": { "External id": 19940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651164931.484, "dur": 44.496, "args": { "External id": 19941,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165025.480, "dur": 36.755, "args": { "External id": 19942,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165071.751, "dur": 45.114, "args": { "External id": 19943,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651165142.661, "dur": 24.172, "args": { "External id": 19944,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2535 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651165185.995, "dur": 28.238, "args": { "External id": 19945,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2536 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651165250.940, "dur": 23.944, "args": { "External id": 19946,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2537 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651165292.775, "dur": 15.677, "args": { "External id": 19947,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165319.752, "dur": 36.092, "args": { "External id": 19948,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165359.277, "dur": 35.456, "args": { "External id": 19949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2540 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651165423.084, "dur": 175.873, "args": { "External id": 19950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651165502.842, "dur": 6.695, "args": { "External id": 19951,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651165511.523, "dur": 2.780, "args": { "External id": 19952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2543 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651165639.868, "dur": 27.975, "args": { "External id": 19953,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2544 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651165680.921, "dur": 14.366, "args": { "External id": 19954,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165705.641, "dur": 38.026, "args": { "External id": 19955,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165751.356, "dur": 37.256, "args": { "External id": 19956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165796.612, "dur": 27.461, "args": { "External id": 19957,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165830.019, "dur": 31.291, "args": { "External id": 19958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165872.590, "dur": 36.713, "args": { "External id": 19959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651165921.890, "dur": 38.689, "args": { "External id": 19960,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2551 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651165979.820, "dur": 63.713, "args": { "External id": 19961,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2552 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651166066.908, "dur": 25.569, "args": { "External id": 19962,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2553 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651166108.467, "dur": 22.442, "args": { "External id": 19963,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2554 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651166145.836, "dur": 16.925, "args": { "External id": 19964,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2555 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651166175.468, "dur": 19.989, "args": { "External id": 19965,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166284.334, "dur": 41.237, "args": { "External id": 19966,"Record function id": 0, "Ev Idx": 2557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166287.460, "dur": 36.965, "args": { "External id": 19967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166291.379, "dur": 32.088, "args": { "External id": 19968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166318.727, "dur": 4.557, "args": { "External id": 19969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166329.990, "dur": 5.527, "args": { "External id": 19970,"Record function id": 0, "Ev Idx": 2561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166331.460, "dur": 3.640, "args": { "External id": 19971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166332.274, "dur": 2.347, "args": { "External id": 19972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166332.890, "dur": 1.632, "args": { "External id": 19973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166338.723, "dur": 4.136, "args": { "External id": 19974,"Record function id": 0, "Ev Idx": 2565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166339.743, "dur": 2.661, "args": { "External id": 19975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166340.222, "dur": 1.755, "args": { "External id": 19976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166340.578, "dur": 1.336, "args": { "External id": 19977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166346.048, "dur": 4.036, "args": { "External id": 19978,"Record function id": 0, "Ev Idx": 2569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166347.275, "dur": 2.419, "args": { "External id": 19979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166347.830, "dur": 1.447, "args": { "External id": 19980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166348.109, "dur": 1.101, "args": { "External id": 19981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166353.132, "dur": 3.728, "args": { "External id": 19982,"Record function id": 0, "Ev Idx": 2573 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166354.262, "dur": 2.200, "args": { "External id": 19983,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166354.772, "dur": 1.293, "args": { "External id": 19984,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2575 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166355.086, "dur": 0.916, "args": { "External id": 19985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2576 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166359.947, "dur": 3.992, "args": { "External id": 19986,"Record function id": 0, "Ev Idx": 2577 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166361.322, "dur": 2.208, "args": { "External id": 19987,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166361.949, "dur": 1.200, "args": { "External id": 19988,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2579 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166362.428, "dur": 0.654, "args": { "External id": 19989,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2580 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166367.738, "dur": 3.533, "args": { "External id": 19990,"Record function id": 0, "Ev Idx": 2581 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166368.618, "dur": 2.241, "args": { "External id": 19991,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166369.107, "dur": 1.343, "args": { "External id": 19992,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2583 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166369.387, "dur": 0.984, "args": { "External id": 19993,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2584 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166374.498, "dur": 4.836, "args": { "External id": 19994,"Record function id": 0, "Ev Idx": 2585 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166375.361, "dur": 3.584, "args": { "External id": 19995,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166375.810, "dur": 2.744, "args": { "External id": 19996,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2587 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166377.675, "dur": 0.791, "args": { "External id": 19997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2588 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166382.661, "dur": 3.275, "args": { "External id": 19998,"Record function id": 0, "Ev Idx": 2589 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651166383.568, "dur": 1.977, "args": { "External id": 19999,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166384.040, "dur": 1.109, "args": { "External id": 20000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2591 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651166384.393, "dur": 0.676, "args": { "External id": 20001,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2592 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651166389.512, "dur": 37467.707, "args": { "External id": 20002,"Record function id": 0, "Sequence number": 246583, "Fwd thread id": 1, "Ev Idx": 2593 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651166390.651, "dur": 37458.156, "args": { "External id": 20003,"Sequence number": 246583, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2594 } }, { "ph": "f", "id": 185, "pid": 1336754, "tid": 1381179, "ts": 1295651166390.651, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651166422.857, "dur": 38.455, "args": { "External id": 20004,"Record function id": 0, "Ev Idx": 2595 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651166469.019, "dur": 60.848, "args": { "External id": 20005,"Record function id": 0, "Ev Idx": 2596 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.21)", "pid": 1336754, "tid": 1381179, "ts": 1295651166535.745, "dur": 37304.647, "args": { "External id": 20006,"Record function id": 0, "Ev Idx": 2597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651166625.724, "dur": 7.304, "args": { "External id": 20007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651166642.410, "dur": 4.702, "args": { "External id": 20008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2599 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651166665.060, "dur": 36341.146, "args": { "External id": 20009,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651166677.742, "dur": 36298.864, "args": { "External id": 20010,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651166716.911, "dur": 14.556, "args": { "External id": 20011,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651166737.817, "dur": 36197.863, "args": { "External id": 20012,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651166740.245, "dur": 36194.761, "args": { "External id": 20013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651166743.834, "dur": 5.973, "args": { "External id": 20014,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651166754.949, "dur": 36176.478, "args": { "External id": 20015,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651203099.181, "dur": 9.033, "args": { "External id": 20016,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651203102.227, "dur": 5.550, "args": { "External id": 20017,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651203139.994, "dur": 412.332, "args": { "External id": 20018,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651203166.515, "dur": 380.421, "args": { "External id": 20019,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2610, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651203177.744, "dur": 363.508, "args": { "External id": 20020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651203573.913, "dur": 2.356, "args": { "External id": 20021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2612, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203637.932, "dur": 7.040, "args": { "External id": 20022,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203690.765, "dur": 1.537, "args": { "External id": 20023,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203708.659, "dur": 1.432, "args": { "External id": 20024,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203720.707, "dur": 1.624, "args": { "External id": 20025,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203732.015, "dur": 1.414, "args": { "External id": 20026,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203742.976, "dur": 1.387, "args": { "External id": 20027,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203754.633, "dur": 1.180, "args": { "External id": 20028,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203766.968, "dur": 3.172, "args": { "External id": 20029,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651203779.920, "dur": 1.254, "args": { "External id": 20030,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2621 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651203871.115, "dur": 2771.337, "args": { "External id": 20031,"Record function id": 0, "Ev Idx": 2622 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651203890.112, "dur": 1032.864, "args": { "External id": 20032,"Record function id": 0, "Ev Idx": 2623 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651203905.348, "dur": 392.773, "args": { "External id": 20033,"Record function id": 0, "Ev Idx": 2624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651203976.826, "dur": 50.794, "args": { "External id": 20034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204034.164, "dur": 1.837, "args": { "External id": 20035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204037.979, "dur": 1.279, "args": { "External id": 20036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204041.043, "dur": 1.207, "args": { "External id": 20037,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204043.717, "dur": 1.338, "args": { "External id": 20038,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204046.516, "dur": 1.082, "args": { "External id": 20039,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204049.085, "dur": 2.258, "args": { "External id": 20040,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204052.819, "dur": 0.896, "args": { "External id": 20041,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204055.273, "dur": 1.523, "args": { "External id": 20042,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651204057.968, "dur": 1.148, "args": { "External id": 20043,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2634 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651204078.082, "dur": 184.394, "args": { "External id": 20044,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651204094.701, "dur": 162.259, "args": { "External id": 20045,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651204115.123, "dur": 12.908, "args": { "External id": 20046,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651204131.052, "dur": 73.629, "args": { "External id": 20047,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651204133.579, "dur": 70.726, "args": { "External id": 20048,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204137.384, "dur": 6.782, "args": { "External id": 20049,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651204146.169, "dur": 57.300, "args": { "External id": 20050,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2641 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.19", "pid": 1336754, "tid": 1381179, "ts": 1295651204376.320, "dur": 538.785, "args": { "External id": 20051,"Record function id": 0, "Ev Idx": 2642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651204394.082, "dur": 508.208, "args": { "External id": 20052,"Record function id": 0, "Ev Idx": 2643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651204449.340, "dur": 5.912, "args": { "External id": 20053,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651204472.110, "dur": 30.284, "args": { "External id": 20054,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204477.132, "dur": 1.390, "args": { "External id": 20055,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204480.530, "dur": 0.667, "args": { "External id": 20056,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204482.904, "dur": 0.823, "args": { "External id": 20057,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204485.239, "dur": 0.803, "args": { "External id": 20058,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204487.505, "dur": 0.489, "args": { "External id": 20059,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204489.429, "dur": 0.912, "args": { "External id": 20060,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204491.924, "dur": 0.671, "args": { "External id": 20061,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204494.530, "dur": 0.582, "args": { "External id": 20062,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204496.435, "dur": 0.697, "args": { "External id": 20063,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651204511.776, "dur": 32.292, "args": { "External id": 20064,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2655 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651204575.155, "dur": 101.061, "args": { "External id": 20065,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651204585.652, "dur": 2.990, "args": { "External id": 20066,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651204593.821, "dur": 9.778, "args": { "External id": 20067,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651204597.903, "dur": 5.292, "args": { "External id": 20068,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204601.401, "dur": 0.537, "args": { "External id": 20069,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651204610.974, "dur": 25.985, "args": { "External id": 20070,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204613.185, "dur": 0.472, "args": { "External id": 20071,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204615.347, "dur": 0.838, "args": { "External id": 20072,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204617.846, "dur": 0.830, "args": { "External id": 20073,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204620.419, "dur": 0.634, "args": { "External id": 20074,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204622.542, "dur": 0.570, "args": { "External id": 20075,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204625.008, "dur": 0.493, "args": { "External id": 20076,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204627.014, "dur": 0.731, "args": { "External id": 20077,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204629.251, "dur": 0.902, "args": { "External id": 20078,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651204631.511, "dur": 0.778, "args": { "External id": 20079,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651204648.346, "dur": 20.193, "args": { "External id": 20080,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2671 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651204722.481, "dur": 109.599, "args": { "External id": 20081,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2672 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651204743.723, "dur": 84.925, "args": { "External id": 20082,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2673, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651204753.147, "dur": 71.309, "args": { "External id": 20083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2674 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651204847.975, "dur": 1.794, "args": { "External id": 20084,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2675, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651204930.167, "dur": 1692.481, "args": { "External id": 20085,"Sequence number": 246582, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2676 } }, { "ph": "f", "id": 186, "pid": 1336754, "tid": 1381179, "ts": 1295651204930.167, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205075.854, "dur": 105.589, "args": { "External id": 20086,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2677 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651205221.130, "dur": 57.946, "args": { "External id": 20087,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651205300.638, "dur": 56.501, "args": { "External id": 20088,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205367.654, "dur": 35.332, "args": { "External id": 20089,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205411.197, "dur": 46.715, "args": { "External id": 20090,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205466.718, "dur": 29.987, "args": { "External id": 20091,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205505.233, "dur": 42.348, "args": { "External id": 20092,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2683 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651205572.324, "dur": 22.368, "args": { "External id": 20093,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2684 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651205615.281, "dur": 27.684, "args": { "External id": 20094,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2685 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651205662.256, "dur": 20.420, "args": { "External id": 20095,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2686 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651205695.395, "dur": 15.803, "args": { "External id": 20096,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205720.445, "dur": 30.927, "args": { "External id": 20097,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651205754.946, "dur": 36.791, "args": { "External id": 20098,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2689 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651205819.292, "dur": 212.974, "args": { "External id": 20099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651205902.765, "dur": 7.065, "args": { "External id": 20100,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651205911.923, "dur": 2.484, "args": { "External id": 20101,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2692 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651206067.861, "dur": 28.780, "args": { "External id": 20102,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2693 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651206108.257, "dur": 15.587, "args": { "External id": 20103,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206133.390, "dur": 42.847, "args": { "External id": 20104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206183.502, "dur": 39.092, "args": { "External id": 20105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206244.045, "dur": 31.682, "args": { "External id": 20106,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206282.307, "dur": 32.301, "args": { "External id": 20107,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206322.184, "dur": 21.615, "args": { "External id": 20108,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651206351.033, "dur": 46.354, "args": { "External id": 20109,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2700 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651206421.347, "dur": 25.367, "args": { "External id": 20110,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2701 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651206464.069, "dur": 28.037, "args": { "External id": 20111,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2702 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651206505.357, "dur": 17.612, "args": { "External id": 20112,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2703 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651206545.103, "dur": 17.097, "args": { "External id": 20113,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2704 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651206574.327, "dur": 16.970, "args": { "External id": 20114,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2705 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206667.697, "dur": 14.993, "args": { "External id": 20115,"Record function id": 0, "Ev Idx": 2706 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206670.910, "dur": 10.804, "args": { "External id": 20116,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206674.990, "dur": 5.889, "args": { "External id": 20117,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2708 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206676.638, "dur": 4.132, "args": { "External id": 20118,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2709 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206686.725, "dur": 5.137, "args": { "External id": 20119,"Record function id": 0, "Ev Idx": 2710 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206687.940, "dur": 3.497, "args": { "External id": 20120,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206688.775, "dur": 2.208, "args": { "External id": 20121,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2712 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206689.277, "dur": 1.617, "args": { "External id": 20122,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2713 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206695.546, "dur": 3.790, "args": { "External id": 20123,"Record function id": 0, "Ev Idx": 2714 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206696.808, "dur": 2.078, "args": { "External id": 20124,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206697.334, "dur": 1.159, "args": { "External id": 20125,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2716 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206697.650, "dur": 0.765, "args": { "External id": 20126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2717 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206702.703, "dur": 3.738, "args": { "External id": 20127,"Record function id": 0, "Ev Idx": 2718 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206703.769, "dur": 2.268, "args": { "External id": 20128,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206704.300, "dur": 1.274, "args": { "External id": 20129,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2720 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206704.762, "dur": 0.752, "args": { "External id": 20130,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206709.766, "dur": 3.563, "args": { "External id": 20131,"Record function id": 0, "Ev Idx": 2722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206710.856, "dur": 2.070, "args": { "External id": 20132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206711.431, "dur": 1.061, "args": { "External id": 20133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206711.859, "dur": 0.573, "args": { "External id": 20134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2725 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206716.488, "dur": 3.249, "args": { "External id": 20135,"Record function id": 0, "Ev Idx": 2726 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206717.591, "dur": 1.743, "args": { "External id": 20136,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206718.017, "dur": 0.929, "args": { "External id": 20137,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2728 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206718.294, "dur": 0.591, "args": { "External id": 20138,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2729 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206722.888, "dur": 3.861, "args": { "External id": 20139,"Record function id": 0, "Ev Idx": 2730 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206723.868, "dur": 2.497, "args": { "External id": 20140,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206724.449, "dur": 1.485, "args": { "External id": 20141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2732 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206725.085, "dur": 0.790, "args": { "External id": 20142,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2733 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206730.171, "dur": 3.914, "args": { "External id": 20143,"Record function id": 0, "Ev Idx": 2734 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206731.358, "dur": 2.336, "args": { "External id": 20144,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206731.816, "dur": 1.471, "args": { "External id": 20145,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2736 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206732.286, "dur": 0.903, "args": { "External id": 20146,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2737 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206737.271, "dur": 3.323, "args": { "External id": 20147,"Record function id": 0, "Ev Idx": 2738 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651206738.276, "dur": 1.940, "args": { "External id": 20148,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206738.701, "dur": 1.122, "args": { "External id": 20149,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2740 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651206738.985, "dur": 0.775, "args": { "External id": 20150,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2741 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651206744.494, "dur": 35606.627, "args": { "External id": 20151,"Record function id": 0, "Sequence number": 246581, "Fwd thread id": 1, "Ev Idx": 2742 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651206745.863, "dur": 35596.591, "args": { "External id": 20152,"Sequence number": 246581, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2743 } }, { "ph": "f", "id": 187, "pid": 1336754, "tid": 1381179, "ts": 1295651206745.863, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651206774.665, "dur": 35.577, "args": { "External id": 20153,"Record function id": 0, "Ev Idx": 2744 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651206817.791, "dur": 64.203, "args": { "External id": 20154,"Record function id": 0, "Ev Idx": 2745 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.20)", "pid": 1336754, "tid": 1381179, "ts": 1295651206888.831, "dur": 35444.308, "args": { "External id": 20155,"Record function id": 0, "Ev Idx": 2746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651206975.694, "dur": 6.380, "args": { "External id": 20156,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651207031.473, "dur": 5.301, "args": { "External id": 20157,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2748 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651207052.482, "dur": 34407.493, "args": { "External id": 20158,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651207065.648, "dur": 34381.908, "args": { "External id": 20159,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651207137.654, "dur": 17.369, "args": { "External id": 20160,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651207161.743, "dur": 34226.995, "args": { "External id": 20161,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651207164.636, "dur": 34222.895, "args": { "External id": 20162,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651207168.962, "dur": 6.168, "args": { "External id": 20163,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651207176.991, "dur": 34203.105, "args": { "External id": 20164,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651241574.245, "dur": 13.755, "args": { "External id": 20165,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651241578.555, "dur": 9.066, "args": { "External id": 20166,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651241624.759, "dur": 355.504, "args": { "External id": 20167,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651241655.472, "dur": 320.070, "args": { "External id": 20168,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2759, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651241668.186, "dur": 301.835, "args": { "External id": 20169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651242034.918, "dur": 3.369, "args": { "External id": 20170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2761, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242103.042, "dur": 7.261, "args": { "External id": 20171,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242156.478, "dur": 1.682, "args": { "External id": 20172,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242175.138, "dur": 0.859, "args": { "External id": 20173,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242188.101, "dur": 1.099, "args": { "External id": 20174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242201.066, "dur": 0.927, "args": { "External id": 20175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242211.747, "dur": 1.090, "args": { "External id": 20176,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242223.792, "dur": 1.229, "args": { "External id": 20177,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242253.423, "dur": 3.026, "args": { "External id": 20178,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242267.145, "dur": 1.027, "args": { "External id": 20179,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2770 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651242366.954, "dur": 2715.317, "args": { "External id": 20180,"Record function id": 0, "Ev Idx": 2771 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651242386.802, "dur": 1021.870, "args": { "External id": 20181,"Record function id": 0, "Ev Idx": 2772 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651242403.555, "dur": 312.224, "args": { "External id": 20182,"Record function id": 0, "Ev Idx": 2773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242477.497, "dur": 4.344, "args": { "External id": 20183,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242485.561, "dur": 0.838, "args": { "External id": 20184,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242488.983, "dur": 0.674, "args": { "External id": 20185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242491.193, "dur": 0.866, "args": { "External id": 20186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242493.367, "dur": 0.707, "args": { "External id": 20187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242499.837, "dur": 0.982, "args": { "External id": 20188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242502.394, "dur": 2.140, "args": { "External id": 20189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242505.826, "dur": 0.675, "args": { "External id": 20190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242507.683, "dur": 0.934, "args": { "External id": 20191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651242511.592, "dur": 0.820, "args": { "External id": 20192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2783 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651242528.787, "dur": 155.413, "args": { "External id": 20193,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651242548.576, "dur": 131.418, "args": { "External id": 20194,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651242564.242, "dur": 12.535, "args": { "External id": 20195,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651242579.888, "dur": 72.111, "args": { "External id": 20196,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651242582.334, "dur": 69.328, "args": { "External id": 20197,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242586.487, "dur": 6.176, "args": { "External id": 20198,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651242594.336, "dur": 56.704, "args": { "External id": 20199,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2790 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.18", "pid": 1336754, "tid": 1381179, "ts": 1295651242791.157, "dur": 609.658, "args": { "External id": 20200,"Record function id": 0, "Ev Idx": 2791 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651242806.707, "dur": 580.625, "args": { "External id": 20201,"Record function id": 0, "Ev Idx": 2792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651242859.381, "dur": 5.055, "args": { "External id": 20202,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651242880.807, "dur": 28.472, "args": { "External id": 20203,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242886.077, "dur": 1.541, "args": { "External id": 20204,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242889.562, "dur": 0.813, "args": { "External id": 20205,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242892.015, "dur": 0.567, "args": { "External id": 20206,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242893.810, "dur": 0.577, "args": { "External id": 20207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242895.891, "dur": 0.512, "args": { "External id": 20208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242897.892, "dur": 0.702, "args": { "External id": 20209,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242899.823, "dur": 0.483, "args": { "External id": 20210,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242902.074, "dur": 0.253, "args": { "External id": 20211,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651242903.521, "dur": 0.195, "args": { "External id": 20212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651242918.688, "dur": 31.463, "args": { "External id": 20213,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2804 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651242979.462, "dur": 147.322, "args": { "External id": 20214,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651243028.487, "dur": 5.851, "args": { "External id": 20215,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651243040.086, "dur": 12.852, "args": { "External id": 20216,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651243045.798, "dur": 6.746, "args": { "External id": 20217,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243050.182, "dur": 0.724, "args": { "External id": 20218,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651243061.878, "dur": 20.583, "args": { "External id": 20219,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243064.114, "dur": 0.572, "args": { "External id": 20220,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243066.114, "dur": 0.348, "args": { "External id": 20221,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243067.570, "dur": 0.317, "args": { "External id": 20222,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243068.851, "dur": 0.750, "args": { "External id": 20223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243070.812, "dur": 0.429, "args": { "External id": 20224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243072.264, "dur": 0.472, "args": { "External id": 20225,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243073.763, "dur": 0.364, "args": { "External id": 20226,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243075.530, "dur": 0.346, "args": { "External id": 20227,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651243077.624, "dur": 0.361, "args": { "External id": 20228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651243093.735, "dur": 24.994, "args": { "External id": 20229,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2820 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651243174.927, "dur": 135.408, "args": { "External id": 20230,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2821 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651243202.895, "dur": 103.385, "args": { "External id": 20231,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2822, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651243212.337, "dur": 89.311, "args": { "External id": 20232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2823 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651243330.108, "dur": 2.257, "args": { "External id": 20233,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2824, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651243416.803, "dur": 1644.842, "args": { "External id": 20234,"Sequence number": 246580, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2825 } }, { "ph": "f", "id": 188, "pid": 1336754, "tid": 1381179, "ts": 1295651243416.803, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651243525.447, "dur": 102.346, "args": { "External id": 20235,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2826 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651243665.080, "dur": 40.455, "args": { "External id": 20236,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651243721.423, "dur": 48.696, "args": { "External id": 20237,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651243780.673, "dur": 33.140, "args": { "External id": 20238,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651243820.718, "dur": 44.266, "args": { "External id": 20239,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651243872.494, "dur": 28.619, "args": { "External id": 20240,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651243909.053, "dur": 41.119, "args": { "External id": 20241,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2832 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651243973.304, "dur": 63.395, "args": { "External id": 20242,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2833 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651244059.961, "dur": 27.217, "args": { "External id": 20243,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2834 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651244109.648, "dur": 20.197, "args": { "External id": 20244,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2835 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651244146.046, "dur": 16.310, "args": { "External id": 20245,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244171.274, "dur": 34.546, "args": { "External id": 20246,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244208.726, "dur": 51.161, "args": { "External id": 20247,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2838 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651244290.105, "dur": 176.729, "args": { "External id": 20248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651244375.012, "dur": 6.024, "args": { "External id": 20249,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651244382.827, "dur": 2.617, "args": { "External id": 20250,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2841 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651244501.274, "dur": 26.764, "args": { "External id": 20251,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2842 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651244539.570, "dur": 14.203, "args": { "External id": 20252,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244564.391, "dur": 39.402, "args": { "External id": 20253,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244609.599, "dur": 37.778, "args": { "External id": 20254,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244654.617, "dur": 21.595, "args": { "External id": 20255,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244680.539, "dur": 28.842, "args": { "External id": 20256,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244715.216, "dur": 33.363, "args": { "External id": 20257,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651244761.031, "dur": 37.671, "args": { "External id": 20258,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651244820.061, "dur": 23.450, "args": { "External id": 20259,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2850 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651244864.879, "dur": 24.823, "args": { "External id": 20260,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651244904.632, "dur": 21.385, "args": { "External id": 20261,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2852 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651244941.581, "dur": 15.838, "args": { "External id": 20262,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2853 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651244977.203, "dur": 51.306, "args": { "External id": 20263,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 2854 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245104.531, "dur": 14.252, "args": { "External id": 20264,"Record function id": 0, "Ev Idx": 2855 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245107.582, "dur": 10.157, "args": { "External id": 20265,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245111.398, "dur": 5.464, "args": { "External id": 20266,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2857 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245112.922, "dur": 3.840, "args": { "External id": 20267,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2858 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245122.607, "dur": 4.892, "args": { "External id": 20268,"Record function id": 0, "Ev Idx": 2859 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245124.047, "dur": 3.016, "args": { "External id": 20269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245125.018, "dur": 1.507, "args": { "External id": 20270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2861 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245125.579, "dur": 0.878, "args": { "External id": 20271,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2862 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245130.777, "dur": 4.140, "args": { "External id": 20272,"Record function id": 0, "Ev Idx": 2863 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245132.227, "dur": 2.255, "args": { "External id": 20273,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245132.744, "dur": 1.271, "args": { "External id": 20274,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2865 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245133.313, "dur": 0.579, "args": { "External id": 20275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 2866 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245138.130, "dur": 3.723, "args": { "External id": 20276,"Record function id": 0, "Ev Idx": 2867 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245139.343, "dur": 2.112, "args": { "External id": 20277,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245140.045, "dur": 0.975, "args": { "External id": 20278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2869 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245140.322, "dur": 0.622, "args": { "External id": 20279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 2870 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245144.899, "dur": 3.563, "args": { "External id": 20280,"Record function id": 0, "Ev Idx": 2871 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245146.069, "dur": 1.960, "args": { "External id": 20281,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245146.556, "dur": 1.057, "args": { "External id": 20282,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2873 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245146.879, "dur": 0.665, "args": { "External id": 20283,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2874 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245151.602, "dur": 4.077, "args": { "External id": 20284,"Record function id": 0, "Ev Idx": 2875 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245152.673, "dur": 2.602, "args": { "External id": 20285,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245153.524, "dur": 1.320, "args": { "External id": 20286,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2877 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245154.004, "dur": 0.773, "args": { "External id": 20287,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2878 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245158.697, "dur": 3.105, "args": { "External id": 20288,"Record function id": 0, "Ev Idx": 2879 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245159.580, "dur": 1.811, "args": { "External id": 20289,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245160.051, "dur": 0.934, "args": { "External id": 20290,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2881 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245160.335, "dur": 0.582, "args": { "External id": 20291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2882 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245164.816, "dur": 3.534, "args": { "External id": 20292,"Record function id": 0, "Ev Idx": 2883 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245165.881, "dur": 2.071, "args": { "External id": 20293,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245166.382, "dur": 1.163, "args": { "External id": 20294,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2885 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245166.734, "dur": 0.743, "args": { "External id": 20295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 2886 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245171.359, "dur": 5.649, "args": { "External id": 20296,"Record function id": 0, "Ev Idx": 2887 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651245172.378, "dur": 4.228, "args": { "External id": 20297,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245172.858, "dur": 3.309, "args": { "External id": 20298,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2889 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651245175.510, "dur": 0.556, "args": { "External id": 20299,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 2890 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651245180.767, "dur": 35862.294, "args": { "External id": 20300,"Record function id": 0, "Sequence number": 246579, "Fwd thread id": 1, "Ev Idx": 2891 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651245182.068, "dur": 35850.893, "args": { "External id": 20301,"Sequence number": 246579, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2892 } }, { "ph": "f", "id": 189, "pid": 1336754, "tid": 1381179, "ts": 1295651245182.068, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651245210.808, "dur": 54.286, "args": { "External id": 20302,"Record function id": 0, "Ev Idx": 2893 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651245276.778, "dur": 66.654, "args": { "External id": 20303,"Record function id": 0, "Ev Idx": 2894 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.19)", "pid": 1336754, "tid": 1381179, "ts": 1295651245349.861, "dur": 35673.221, "args": { "External id": 20304,"Record function id": 0, "Ev Idx": 2895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651245438.671, "dur": 10.453, "args": { "External id": 20305,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651245459.365, "dur": 5.002, "args": { "External id": 20306,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2897 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651245478.113, "dur": 34695.243, "args": { "External id": 20307,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651245491.194, "dur": 34673.265, "args": { "External id": 20308,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 2899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651245540.402, "dur": 14.042, "args": { "External id": 20309,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651245560.643, "dur": 34564.963, "args": { "External id": 20310,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 2901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651245563.393, "dur": 34561.506, "args": { "External id": 20311,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 2902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651245567.138, "dur": 4.795, "args": { "External id": 20312,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651245573.686, "dur": 34547.307, "args": { "External id": 20313,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 2904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651280282.283, "dur": 9.893, "args": { "External id": 20314,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 2905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651280284.938, "dur": 6.638, "args": { "External id": 20315,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651280322.049, "dur": 386.642, "args": { "External id": 20316,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 2907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651280352.466, "dur": 351.306, "args": { "External id": 20317,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2908, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651280363.190, "dur": 334.674, "args": { "External id": 20318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 2909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651280733.455, "dur": 2.376, "args": { "External id": 20319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2910, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280794.835, "dur": 6.782, "args": { "External id": 20320,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280846.265, "dur": 1.500, "args": { "External id": 20321,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280862.835, "dur": 1.215, "args": { "External id": 20322,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280875.495, "dur": 1.023, "args": { "External id": 20323,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280888.501, "dur": 0.913, "args": { "External id": 20324,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280898.622, "dur": 0.963, "args": { "External id": 20325,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280909.719, "dur": 1.042, "args": { "External id": 20326,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280919.760, "dur": 1.968, "args": { "External id": 20327,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651280930.728, "dur": 0.716, "args": { "External id": 20328,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2919 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651281059.840, "dur": 2649.150, "args": { "External id": 20329,"Record function id": 0, "Ev Idx": 2920 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651281079.972, "dur": 1000.590, "args": { "External id": 20330,"Record function id": 0, "Ev Idx": 2921 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651281094.931, "dur": 330.335, "args": { "External id": 20331,"Record function id": 0, "Ev Idx": 2922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281173.167, "dur": 4.375, "args": { "External id": 20332,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 2923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281183.149, "dur": 1.144, "args": { "External id": 20333,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281185.838, "dur": 0.955, "args": { "External id": 20334,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281188.346, "dur": 0.747, "args": { "External id": 20335,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281190.385, "dur": 0.908, "args": { "External id": 20336,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281194.702, "dur": 0.749, "args": { "External id": 20337,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 2928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281196.747, "dur": 1.486, "args": { "External id": 20338,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 2929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281199.570, "dur": 0.535, "args": { "External id": 20339,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281201.419, "dur": 0.727, "args": { "External id": 20340,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651281204.863, "dur": 0.702, "args": { "External id": 20341,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 2932 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651281223.867, "dur": 170.849, "args": { "External id": 20342,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651281256.442, "dur": 133.470, "args": { "External id": 20343,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 2934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651281274.339, "dur": 13.108, "args": { "External id": 20344,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651281290.336, "dur": 65.999, "args": { "External id": 20345,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 2936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651281292.716, "dur": 63.319, "args": { "External id": 20346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 2937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281296.580, "dur": 5.181, "args": { "External id": 20347,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651281303.623, "dur": 51.946, "args": { "External id": 20348,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 2939 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.17", "pid": 1336754, "tid": 1381179, "ts": 1295651281508.654, "dur": 564.212, "args": { "External id": 20349,"Record function id": 0, "Ev Idx": 2940 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651281524.126, "dur": 535.227, "args": { "External id": 20350,"Record function id": 0, "Ev Idx": 2941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651281576.303, "dur": 5.141, "args": { "External id": 20351,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651281597.222, "dur": 27.412, "args": { "External id": 20352,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281602.200, "dur": 1.465, "args": { "External id": 20353,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281605.349, "dur": 0.599, "args": { "External id": 20354,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281607.662, "dur": 0.330, "args": { "External id": 20355,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281609.456, "dur": 0.347, "args": { "External id": 20356,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281610.926, "dur": 0.554, "args": { "External id": 20357,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281612.673, "dur": 0.800, "args": { "External id": 20358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281616.949, "dur": 0.322, "args": { "External id": 20359,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281618.517, "dur": 0.347, "args": { "External id": 20360,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281619.734, "dur": 0.287, "args": { "External id": 20361,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651281633.600, "dur": 33.122, "args": { "External id": 20362,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2953 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651281697.637, "dur": 95.206, "args": { "External id": 20363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 2954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651281707.192, "dur": 3.357, "args": { "External id": 20364,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651281715.602, "dur": 10.407, "args": { "External id": 20365,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651281720.875, "dur": 4.741, "args": { "External id": 20366,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 2957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281723.813, "dur": 0.527, "args": { "External id": 20367,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 2958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651281732.875, "dur": 17.788, "args": { "External id": 20368,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 2959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281734.698, "dur": 0.611, "args": { "External id": 20369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281736.592, "dur": 0.377, "args": { "External id": 20370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281737.908, "dur": 0.273, "args": { "External id": 20371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281739.404, "dur": 0.304, "args": { "External id": 20372,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281740.887, "dur": 0.316, "args": { "External id": 20373,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281742.253, "dur": 0.248, "args": { "External id": 20374,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281743.645, "dur": 0.431, "args": { "External id": 20375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281745.046, "dur": 0.385, "args": { "External id": 20376,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651281746.585, "dur": 0.591, "args": { "External id": 20377,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 2968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651281764.921, "dur": 20.763, "args": { "External id": 20378,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 2969 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651281833.779, "dur": 115.244, "args": { "External id": 20379,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 2970 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651281861.598, "dur": 84.359, "args": { "External id": 20380,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 2971, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651281870.248, "dur": 71.565, "args": { "External id": 20381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 2972 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651281965.794, "dur": 1.761, "args": { "External id": 20382,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 2973, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651282087.745, "dur": 1602.817, "args": { "External id": 20383,"Sequence number": 246578, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 2974 } }, { "ph": "f", "id": 190, "pid": 1336754, "tid": 1381179, "ts": 1295651282087.745, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282193.436, "dur": 120.867, "args": { "External id": 20384,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 2975 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651282357.907, "dur": 39.650, "args": { "External id": 20385,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 2976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651282413.790, "dur": 51.984, "args": { "External id": 20386,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 2977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282475.150, "dur": 34.361, "args": { "External id": 20387,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282515.629, "dur": 44.079, "args": { "External id": 20388,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282566.856, "dur": 26.774, "args": { "External id": 20389,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 2980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282601.029, "dur": 41.181, "args": { "External id": 20390,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 2981 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651282665.590, "dur": 24.111, "args": { "External id": 20391,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 2982 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651282710.377, "dur": 26.767, "args": { "External id": 20392,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2983 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651282758.723, "dur": 19.527, "args": { "External id": 20393,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 2984 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651282792.195, "dur": 16.035, "args": { "External id": 20394,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 2985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282818.017, "dur": 31.170, "args": { "External id": 20395,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651282852.328, "dur": 31.910, "args": { "External id": 20396,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2987 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651282908.715, "dur": 208.236, "args": { "External id": 20397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 2988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651283020.489, "dur": 7.114, "args": { "External id": 20398,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651283029.892, "dur": 2.202, "args": { "External id": 20399,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 2990 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651283148.371, "dur": 28.852, "args": { "External id": 20400,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2991 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651283188.048, "dur": 14.842, "args": { "External id": 20401,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 2992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283210.963, "dur": 60.232, "args": { "External id": 20402,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283280.041, "dur": 38.573, "args": { "External id": 20403,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283329.495, "dur": 22.842, "args": { "External id": 20404,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283356.876, "dur": 32.925, "args": { "External id": 20405,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283396.067, "dur": 21.359, "args": { "External id": 20406,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 2997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651283423.613, "dur": 28.828, "args": { "External id": 20407,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 2998 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651283474.311, "dur": 36.437, "args": { "External id": 20408,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 2999 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651283537.328, "dur": 29.893, "args": { "External id": 20409,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3000 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651283582.142, "dur": 18.232, "args": { "External id": 20410,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3001 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651283615.867, "dur": 15.455, "args": { "External id": 20411,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3002 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651283644.662, "dur": 15.240, "args": { "External id": 20412,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3003 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283734.311, "dur": 14.112, "args": { "External id": 20413,"Record function id": 0, "Ev Idx": 3004 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283737.460, "dur": 10.140, "args": { "External id": 20414,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283741.276, "dur": 5.417, "args": { "External id": 20415,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3006 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283742.664, "dur": 3.931, "args": { "External id": 20416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3007 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283752.505, "dur": 4.049, "args": { "External id": 20417,"Record function id": 0, "Ev Idx": 3008 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283753.680, "dur": 2.443, "args": { "External id": 20418,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283754.374, "dur": 1.253, "args": { "External id": 20419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3010 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283754.707, "dur": 0.853, "args": { "External id": 20420,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3011 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283759.927, "dur": 4.230, "args": { "External id": 20421,"Record function id": 0, "Ev Idx": 3012 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283761.123, "dur": 2.603, "args": { "External id": 20422,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283761.647, "dur": 1.640, "args": { "External id": 20423,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3014 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283762.347, "dur": 0.840, "args": { "External id": 20424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3015 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283767.304, "dur": 3.454, "args": { "External id": 20425,"Record function id": 0, "Ev Idx": 3016 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283768.267, "dur": 2.089, "args": { "External id": 20426,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283768.777, "dur": 1.130, "args": { "External id": 20427,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3018 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283769.171, "dur": 0.641, "args": { "External id": 20428,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3019 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283773.865, "dur": 3.464, "args": { "External id": 20429,"Record function id": 0, "Ev Idx": 3020 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283774.768, "dur": 2.119, "args": { "External id": 20430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283775.483, "dur": 0.994, "args": { "External id": 20431,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3022 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283775.750, "dur": 0.660, "args": { "External id": 20432,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3023 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283780.459, "dur": 3.640, "args": { "External id": 20433,"Record function id": 0, "Ev Idx": 3024 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283781.429, "dur": 2.279, "args": { "External id": 20434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283781.903, "dur": 1.389, "args": { "External id": 20435,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3026 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283782.361, "dur": 0.831, "args": { "External id": 20436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3027 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283787.384, "dur": 3.897, "args": { "External id": 20437,"Record function id": 0, "Ev Idx": 3028 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283788.257, "dur": 2.583, "args": { "External id": 20438,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283789.222, "dur": 1.190, "args": { "External id": 20439,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3030 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283789.734, "dur": 0.563, "args": { "External id": 20440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3031 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283794.301, "dur": 3.502, "args": { "External id": 20441,"Record function id": 0, "Ev Idx": 3032 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283795.270, "dur": 2.144, "args": { "External id": 20442,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283795.852, "dur": 1.153, "args": { "External id": 20443,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3034 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283796.129, "dur": 0.809, "args": { "External id": 20444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3035 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283800.943, "dur": 3.567, "args": { "External id": 20445,"Record function id": 0, "Ev Idx": 3036 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651283801.959, "dur": 2.112, "args": { "External id": 20446,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283802.415, "dur": 1.256, "args": { "External id": 20447,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3038 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651283802.837, "dur": 0.768, "args": { "External id": 20448,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3039 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651283808.118, "dur": 36141.517, "args": { "External id": 20449,"Record function id": 0, "Sequence number": 246577, "Fwd thread id": 1, "Ev Idx": 3040 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651283809.209, "dur": 36132.292, "args": { "External id": 20450,"Sequence number": 246577, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3041 } }, { "ph": "f", "id": 191, "pid": 1336754, "tid": 1381179, "ts": 1295651283809.209, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651283837.525, "dur": 37.415, "args": { "External id": 20451,"Record function id": 0, "Ev Idx": 3042 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651283882.716, "dur": 58.842, "args": { "External id": 20452,"Record function id": 0, "Ev Idx": 3043 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.18)", "pid": 1336754, "tid": 1381179, "ts": 1295651283947.342, "dur": 35986.561, "args": { "External id": 20453,"Record function id": 0, "Ev Idx": 3044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651284080.322, "dur": 7.181, "args": { "External id": 20454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651284100.818, "dur": 4.906, "args": { "External id": 20455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3046 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651284120.370, "dur": 35006.138, "args": { "External id": 20456,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651284143.591, "dur": 34974.990, "args": { "External id": 20457,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651284213.149, "dur": 14.356, "args": { "External id": 20458,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651284249.972, "dur": 34827.143, "args": { "External id": 20459,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651284252.820, "dur": 34823.702, "args": { "External id": 20460,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651284256.901, "dur": 9.728, "args": { "External id": 20461,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651284268.559, "dur": 34804.739, "args": { "External id": 20462,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651319215.430, "dur": 9.388, "args": { "External id": 20463,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651319217.939, "dur": 6.538, "args": { "External id": 20464,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651319265.304, "dur": 384.485, "args": { "External id": 20465,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651319296.528, "dur": 348.528, "args": { "External id": 20466,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3057, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651319307.608, "dur": 332.018, "args": { "External id": 20467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651319671.987, "dur": 2.460, "args": { "External id": 20468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3059, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319736.243, "dur": 6.777, "args": { "External id": 20469,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319786.684, "dur": 1.330, "args": { "External id": 20470,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319802.558, "dur": 1.361, "args": { "External id": 20471,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319816.120, "dur": 1.051, "args": { "External id": 20472,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319829.195, "dur": 1.026, "args": { "External id": 20473,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319839.993, "dur": 0.875, "args": { "External id": 20474,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319851.066, "dur": 0.849, "args": { "External id": 20475,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319862.075, "dur": 1.982, "args": { "External id": 20476,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651319873.608, "dur": 0.841, "args": { "External id": 20477,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3068 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651319963.483, "dur": 2743.514, "args": { "External id": 20478,"Record function id": 0, "Ev Idx": 3069 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651320031.597, "dur": 1029.055, "args": { "External id": 20479,"Record function id": 0, "Ev Idx": 3070 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651320051.016, "dur": 349.300, "args": { "External id": 20480,"Record function id": 0, "Ev Idx": 3071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320152.825, "dur": 5.212, "args": { "External id": 20481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320163.750, "dur": 1.181, "args": { "External id": 20482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320166.493, "dur": 0.908, "args": { "External id": 20483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320168.701, "dur": 0.875, "args": { "External id": 20484,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320170.846, "dur": 0.923, "args": { "External id": 20485,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320174.571, "dur": 0.593, "args": { "External id": 20486,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320176.518, "dur": 1.709, "args": { "External id": 20487,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320179.499, "dur": 0.710, "args": { "External id": 20488,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320181.295, "dur": 0.687, "args": { "External id": 20489,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651320185.049, "dur": 0.942, "args": { "External id": 20490,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3081 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651320202.155, "dur": 165.521, "args": { "External id": 20491,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651320219.247, "dur": 143.169, "args": { "External id": 20492,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651320249.585, "dur": 14.442, "args": { "External id": 20493,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651320267.108, "dur": 67.828, "args": { "External id": 20494,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651320269.218, "dur": 65.134, "args": { "External id": 20495,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320273.105, "dur": 5.706, "args": { "External id": 20496,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651320280.422, "dur": 53.370, "args": { "External id": 20497,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3088 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.16", "pid": 1336754, "tid": 1381179, "ts": 1295651320481.002, "dur": 571.163, "args": { "External id": 20498,"Record function id": 0, "Ev Idx": 3089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651320497.989, "dur": 539.871, "args": { "External id": 20499,"Record function id": 0, "Ev Idx": 3090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651320555.878, "dur": 7.962, "args": { "External id": 20500,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651320580.448, "dur": 24.337, "args": { "External id": 20501,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320585.323, "dur": 1.605, "args": { "External id": 20502,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320588.792, "dur": 0.396, "args": { "External id": 20503,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320590.539, "dur": 0.331, "args": { "External id": 20504,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320591.931, "dur": 0.537, "args": { "External id": 20505,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320593.617, "dur": 0.358, "args": { "External id": 20506,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320595.343, "dur": 0.282, "args": { "External id": 20507,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320596.835, "dur": 0.453, "args": { "External id": 20508,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320598.236, "dur": 0.342, "args": { "External id": 20509,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320599.678, "dur": 0.227, "args": { "External id": 20510,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651320614.513, "dur": 31.236, "args": { "External id": 20511,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3102 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651320675.235, "dur": 95.637, "args": { "External id": 20512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651320684.590, "dur": 3.453, "args": { "External id": 20513,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651320693.107, "dur": 11.441, "args": { "External id": 20514,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651320699.136, "dur": 5.014, "args": { "External id": 20515,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320702.289, "dur": 0.709, "args": { "External id": 20516,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651320711.699, "dur": 18.144, "args": { "External id": 20517,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320714.486, "dur": 0.485, "args": { "External id": 20518,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320716.353, "dur": 0.483, "args": { "External id": 20519,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320717.854, "dur": 0.344, "args": { "External id": 20520,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320719.348, "dur": 0.293, "args": { "External id": 20521,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320720.815, "dur": 0.178, "args": { "External id": 20522,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320722.093, "dur": 0.493, "args": { "External id": 20523,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320723.438, "dur": 0.382, "args": { "External id": 20524,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320724.705, "dur": 0.265, "args": { "External id": 20525,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651320726.121, "dur": 0.199, "args": { "External id": 20526,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651320743.529, "dur": 20.363, "args": { "External id": 20527,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3118 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651320814.060, "dur": 118.216, "args": { "External id": 20528,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3119 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651320842.642, "dur": 86.305, "args": { "External id": 20529,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3120, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651320851.944, "dur": 72.075, "args": { "External id": 20530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3121 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651320947.943, "dur": 1.819, "args": { "External id": 20531,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3122, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651321068.810, "dur": 1618.833, "args": { "External id": 20532,"Sequence number": 246576, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3123 } }, { "ph": "f", "id": 192, "pid": 1336754, "tid": 1381179, "ts": 1295651321068.810, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321173.304, "dur": 122.654, "args": { "External id": 20533,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3124 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651321338.713, "dur": 39.760, "args": { "External id": 20534,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651321395.415, "dur": 52.912, "args": { "External id": 20535,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321458.321, "dur": 33.160, "args": { "External id": 20536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321497.941, "dur": 44.747, "args": { "External id": 20537,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321549.741, "dur": 28.124, "args": { "External id": 20538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321584.936, "dur": 41.900, "args": { "External id": 20539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3130 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651321650.213, "dur": 23.732, "args": { "External id": 20540,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3131 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651321692.721, "dur": 27.592, "args": { "External id": 20541,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3132 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651321740.416, "dur": 19.044, "args": { "External id": 20542,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3133 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651321774.183, "dur": 15.903, "args": { "External id": 20543,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321798.397, "dur": 30.468, "args": { "External id": 20544,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651321831.834, "dur": 32.253, "args": { "External id": 20545,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3136 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651321888.581, "dur": 205.022, "args": { "External id": 20546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651321963.233, "dur": 5.971, "args": { "External id": 20547,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651321971.131, "dur": 2.391, "args": { "External id": 20548,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3139 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651322130.885, "dur": 27.957, "args": { "External id": 20549,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3140 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651322176.505, "dur": 15.104, "args": { "External id": 20550,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322200.966, "dur": 63.998, "args": { "External id": 20551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322273.653, "dur": 43.897, "args": { "External id": 20552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322325.812, "dur": 23.189, "args": { "External id": 20553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322353.674, "dur": 30.421, "args": { "External id": 20554,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322390.306, "dur": 22.217, "args": { "External id": 20555,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651322420.164, "dur": 29.235, "args": { "External id": 20556,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3147 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651322484.965, "dur": 29.287, "args": { "External id": 20557,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3148 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651322534.625, "dur": 25.356, "args": { "External id": 20558,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3149 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651322576.992, "dur": 18.774, "args": { "External id": 20559,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3150 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651322611.818, "dur": 19.459, "args": { "External id": 20560,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3151 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651322644.124, "dur": 16.186, "args": { "External id": 20561,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3152 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322728.698, "dur": 15.639, "args": { "External id": 20562,"Record function id": 0, "Ev Idx": 3153 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322732.085, "dur": 11.309, "args": { "External id": 20563,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322736.125, "dur": 6.329, "args": { "External id": 20564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3155 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322737.805, "dur": 4.563, "args": { "External id": 20565,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3156 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322748.245, "dur": 4.990, "args": { "External id": 20566,"Record function id": 0, "Ev Idx": 3157 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322749.594, "dur": 3.195, "args": { "External id": 20567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322750.683, "dur": 1.593, "args": { "External id": 20568,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3159 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322751.400, "dur": 0.812, "args": { "External id": 20569,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3160 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322756.553, "dur": 4.348, "args": { "External id": 20570,"Record function id": 0, "Ev Idx": 3161 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322757.733, "dur": 2.698, "args": { "External id": 20571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322758.259, "dur": 1.733, "args": { "External id": 20572,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3163 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322759.057, "dur": 0.850, "args": { "External id": 20573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3164 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322764.111, "dur": 4.634, "args": { "External id": 20574,"Record function id": 0, "Ev Idx": 3165 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322765.194, "dur": 3.143, "args": { "External id": 20575,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322766.109, "dur": 1.820, "args": { "External id": 20576,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3167 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322766.589, "dur": 1.238, "args": { "External id": 20577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3168 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322771.903, "dur": 4.926, "args": { "External id": 20578,"Record function id": 0, "Ev Idx": 3169 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322773.129, "dur": 3.278, "args": { "External id": 20579,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322774.145, "dur": 1.757, "args": { "External id": 20580,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3171 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322774.799, "dur": 1.042, "args": { "External id": 20581,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3172 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322779.983, "dur": 4.204, "args": { "External id": 20582,"Record function id": 0, "Ev Idx": 3173 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322781.109, "dur": 2.667, "args": { "External id": 20583,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322781.838, "dur": 1.490, "args": { "External id": 20584,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3175 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322782.378, "dur": 0.863, "args": { "External id": 20585,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3176 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322787.402, "dur": 3.697, "args": { "External id": 20586,"Record function id": 0, "Ev Idx": 3177 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322788.384, "dur": 2.291, "args": { "External id": 20587,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322788.833, "dur": 1.421, "args": { "External id": 20588,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3179 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322789.374, "dur": 0.767, "args": { "External id": 20589,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3180 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322794.328, "dur": 3.569, "args": { "External id": 20590,"Record function id": 0, "Ev Idx": 3181 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322795.308, "dur": 2.192, "args": { "External id": 20591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322795.749, "dur": 1.339, "args": { "External id": 20592,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3183 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322796.061, "dur": 0.940, "args": { "External id": 20593,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3184 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322801.081, "dur": 4.248, "args": { "External id": 20594,"Record function id": 0, "Ev Idx": 3185 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651322801.962, "dur": 2.954, "args": { "External id": 20595,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322802.409, "dur": 2.111, "args": { "External id": 20596,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3187 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651322803.023, "dur": 1.431, "args": { "External id": 20597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3188 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651322809.256, "dur": 36375.363, "args": { "External id": 20598,"Record function id": 0, "Sequence number": 246575, "Fwd thread id": 1, "Ev Idx": 3189 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651322810.593, "dur": 36365.136, "args": { "External id": 20599,"Sequence number": 246575, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3190 } }, { "ph": "f", "id": 193, "pid": 1336754, "tid": 1381179, "ts": 1295651322810.593, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651322839.589, "dur": 37.400, "args": { "External id": 20600,"Record function id": 0, "Ev Idx": 3191 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651322884.808, "dur": 59.060, "args": { "External id": 20601,"Record function id": 0, "Ev Idx": 3192 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.17)", "pid": 1336754, "tid": 1381179, "ts": 1295651322949.663, "dur": 36218.665, "args": { "External id": 20602,"Record function id": 0, "Ev Idx": 3193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651323080.292, "dur": 7.086, "args": { "External id": 20603,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651323100.554, "dur": 5.297, "args": { "External id": 20604,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3195 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651323120.341, "dur": 35251.386, "args": { "External id": 20605,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651323134.155, "dur": 35229.017, "args": { "External id": 20606,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651323194.423, "dur": 17.294, "args": { "External id": 20607,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651323217.802, "dur": 35108.541, "args": { "External id": 20608,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651323220.262, "dur": 35105.498, "args": { "External id": 20609,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651323223.757, "dur": 20.814, "args": { "External id": 20610,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651323247.151, "dur": 35075.068, "args": { "External id": 20611,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651358461.078, "dur": 8.433, "args": { "External id": 20612,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651358463.709, "dur": 5.478, "args": { "External id": 20613,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651358497.032, "dur": 340.923, "args": { "External id": 20614,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651358527.837, "dur": 305.754, "args": { "External id": 20615,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3206, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651358538.577, "dur": 289.808, "args": { "External id": 20616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651358859.488, "dur": 2.418, "args": { "External id": 20617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3208, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651358916.212, "dur": 6.548, "args": { "External id": 20618,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651358965.090, "dur": 2.116, "args": { "External id": 20619,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359027.687, "dur": 2.022, "args": { "External id": 20620,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359046.777, "dur": 1.102, "args": { "External id": 20621,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359059.193, "dur": 0.916, "args": { "External id": 20622,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359069.619, "dur": 1.016, "args": { "External id": 20623,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359081.394, "dur": 0.987, "args": { "External id": 20624,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359093.272, "dur": 1.002, "args": { "External id": 20625,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359106.349, "dur": 1.343, "args": { "External id": 20626,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3217 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651359199.974, "dur": 2640.765, "args": { "External id": 20627,"Record function id": 0, "Ev Idx": 3218 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651359218.909, "dur": 998.140, "args": { "External id": 20628,"Record function id": 0, "Ev Idx": 3219 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651359248.070, "dur": 314.621, "args": { "External id": 20629,"Record function id": 0, "Ev Idx": 3220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359327.303, "dur": 4.948, "args": { "External id": 20630,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359335.876, "dur": 1.213, "args": { "External id": 20631,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359338.782, "dur": 1.629, "args": { "External id": 20632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359341.890, "dur": 1.143, "args": { "External id": 20633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359346.345, "dur": 1.390, "args": { "External id": 20634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359349.128, "dur": 1.389, "args": { "External id": 20635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359352.000, "dur": 1.128, "args": { "External id": 20636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359354.373, "dur": 0.955, "args": { "External id": 20637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359358.254, "dur": 1.438, "args": { "External id": 20638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651359361.040, "dur": 1.639, "args": { "External id": 20639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3230 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651359379.931, "dur": 151.027, "args": { "External id": 20640,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651359395.726, "dur": 131.100, "args": { "External id": 20641,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651359413.431, "dur": 12.162, "args": { "External id": 20642,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651359428.611, "dur": 69.856, "args": { "External id": 20643,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651359430.819, "dur": 67.301, "args": { "External id": 20644,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359434.088, "dur": 5.699, "args": { "External id": 20645,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651359443.330, "dur": 54.323, "args": { "External id": 20646,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3237 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.15", "pid": 1336754, "tid": 1381179, "ts": 1295651359639.686, "dur": 569.240, "args": { "External id": 20647,"Record function id": 0, "Ev Idx": 3238 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651359656.289, "dur": 539.331, "args": { "External id": 20648,"Record function id": 0, "Ev Idx": 3239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651359709.897, "dur": 5.057, "args": { "External id": 20649,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651359731.206, "dur": 24.071, "args": { "External id": 20650,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359735.917, "dur": 2.103, "args": { "External id": 20651,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359739.416, "dur": 0.370, "args": { "External id": 20652,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359741.209, "dur": 0.667, "args": { "External id": 20653,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359743.133, "dur": 0.510, "args": { "External id": 20654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359744.467, "dur": 0.448, "args": { "External id": 20655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359745.772, "dur": 0.602, "args": { "External id": 20656,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359747.270, "dur": 0.774, "args": { "External id": 20657,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359749.038, "dur": 0.894, "args": { "External id": 20658,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359750.946, "dur": 0.582, "args": { "External id": 20659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651359764.421, "dur": 30.687, "args": { "External id": 20660,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3251 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651359824.387, "dur": 98.343, "args": { "External id": 20661,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651359833.839, "dur": 3.463, "args": { "External id": 20662,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651359842.016, "dur": 10.447, "args": { "External id": 20663,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651359845.893, "dur": 6.169, "args": { "External id": 20664,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359848.800, "dur": 1.133, "args": { "External id": 20665,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651359858.793, "dur": 26.163, "args": { "External id": 20666,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359860.214, "dur": 0.389, "args": { "External id": 20667,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359862.129, "dur": 0.656, "args": { "External id": 20668,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359863.678, "dur": 0.578, "args": { "External id": 20669,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359865.271, "dur": 0.778, "args": { "External id": 20670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359867.729, "dur": 0.784, "args": { "External id": 20671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359870.107, "dur": 0.662, "args": { "External id": 20672,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359872.071, "dur": 0.734, "args": { "External id": 20673,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359873.866, "dur": 0.697, "args": { "External id": 20674,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651359875.792, "dur": 0.739, "args": { "External id": 20675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651359895.404, "dur": 20.098, "args": { "External id": 20676,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3267 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651359965.710, "dur": 157.473, "args": { "External id": 20677,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3268 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651360029.170, "dur": 90.321, "args": { "External id": 20678,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3269, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651360040.381, "dur": 74.958, "args": { "External id": 20679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3270 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651360140.251, "dur": 1.754, "args": { "External id": 20680,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3271, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651360224.112, "dur": 1597.930, "args": { "External id": 20681,"Sequence number": 246574, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3272 } }, { "ph": "f", "id": 194, "pid": 1336754, "tid": 1381179, "ts": 1295651360224.112, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360346.359, "dur": 104.248, "args": { "External id": 20682,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3273 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651360489.479, "dur": 38.089, "args": { "External id": 20683,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651360542.931, "dur": 55.476, "args": { "External id": 20684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360608.071, "dur": 32.970, "args": { "External id": 20685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360647.690, "dur": 43.004, "args": { "External id": 20686,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360705.246, "dur": 28.042, "args": { "External id": 20687,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360740.665, "dur": 40.867, "args": { "External id": 20688,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3279 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651360806.239, "dur": 22.397, "args": { "External id": 20689,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3280 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651360847.829, "dur": 28.589, "args": { "External id": 20690,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3281 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651360896.678, "dur": 19.099, "args": { "External id": 20691,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3282 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651360927.706, "dur": 15.765, "args": { "External id": 20692,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651360952.511, "dur": 67.360, "args": { "External id": 20693,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361026.076, "dur": 36.921, "args": { "External id": 20694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3285 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651361091.779, "dur": 189.920, "args": { "External id": 20695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651361173.311, "dur": 9.404, "args": { "External id": 20696,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651361184.617, "dur": 2.315, "args": { "External id": 20697,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3288 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651361315.074, "dur": 28.822, "args": { "External id": 20698,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3289 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651361354.842, "dur": 16.045, "args": { "External id": 20699,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361379.881, "dur": 39.599, "args": { "External id": 20700,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361425.022, "dur": 34.631, "args": { "External id": 20701,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361466.409, "dur": 21.599, "args": { "External id": 20702,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361493.230, "dur": 28.502, "args": { "External id": 20703,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361527.880, "dur": 21.462, "args": { "External id": 20704,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651361556.710, "dur": 28.638, "args": { "External id": 20705,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651361604.008, "dur": 24.338, "args": { "External id": 20706,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3297 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651361659.338, "dur": 30.905, "args": { "External id": 20707,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651361705.620, "dur": 17.728, "args": { "External id": 20708,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3299 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651361740.536, "dur": 16.563, "args": { "External id": 20709,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3300 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651361773.890, "dur": 17.714, "args": { "External id": 20710,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3301 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361862.792, "dur": 18.474, "args": { "External id": 20711,"Record function id": 0, "Ev Idx": 3302 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361866.272, "dur": 14.127, "args": { "External id": 20712,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361870.087, "dur": 9.297, "args": { "External id": 20713,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3304 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361871.392, "dur": 7.875, "args": { "External id": 20714,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3305 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361885.069, "dur": 4.449, "args": { "External id": 20715,"Record function id": 0, "Ev Idx": 3306 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361886.452, "dur": 2.606, "args": { "External id": 20716,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361887.158, "dur": 1.378, "args": { "External id": 20717,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3308 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361887.590, "dur": 0.881, "args": { "External id": 20718,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3309 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361892.741, "dur": 4.428, "args": { "External id": 20719,"Record function id": 0, "Ev Idx": 3310 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361893.880, "dur": 2.848, "args": { "External id": 20720,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361894.608, "dur": 1.703, "args": { "External id": 20721,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3312 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361895.211, "dur": 0.997, "args": { "External id": 20722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3313 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361900.350, "dur": 4.321, "args": { "External id": 20723,"Record function id": 0, "Ev Idx": 3314 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361901.364, "dur": 2.810, "args": { "External id": 20724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361901.999, "dur": 1.698, "args": { "External id": 20725,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3316 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361902.678, "dur": 0.925, "args": { "External id": 20726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3317 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361907.757, "dur": 4.552, "args": { "External id": 20727,"Record function id": 0, "Ev Idx": 3318 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361908.805, "dur": 3.051, "args": { "External id": 20728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361909.778, "dur": 1.589, "args": { "External id": 20729,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3320 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361910.058, "dur": 1.216, "args": { "External id": 20730,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3321 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361915.607, "dur": 4.084, "args": { "External id": 20731,"Record function id": 0, "Ev Idx": 3322 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361916.697, "dur": 2.595, "args": { "External id": 20732,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361917.316, "dur": 1.519, "args": { "External id": 20733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3324 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361917.878, "dur": 0.839, "args": { "External id": 20734,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3325 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361922.970, "dur": 3.503, "args": { "External id": 20735,"Record function id": 0, "Ev Idx": 3326 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361924.069, "dur": 1.985, "args": { "External id": 20736,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361924.570, "dur": 1.077, "args": { "External id": 20737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3328 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361924.836, "dur": 0.716, "args": { "External id": 20738,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3329 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361929.841, "dur": 3.537, "args": { "External id": 20739,"Record function id": 0, "Ev Idx": 3330 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361930.961, "dur": 2.020, "args": { "External id": 20740,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361931.438, "dur": 1.111, "args": { "External id": 20741,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3332 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361931.716, "dur": 0.766, "args": { "External id": 20742,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3333 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361940.474, "dur": 3.740, "args": { "External id": 20743,"Record function id": 0, "Ev Idx": 3334 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651361941.631, "dur": 2.165, "args": { "External id": 20744,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361942.092, "dur": 1.306, "args": { "External id": 20745,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3336 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651361942.480, "dur": 0.850, "args": { "External id": 20746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3337 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651361948.022, "dur": 37175.496, "args": { "External id": 20747,"Record function id": 0, "Sequence number": 246573, "Fwd thread id": 1, "Ev Idx": 3338 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651361949.075, "dur": 37165.813, "args": { "External id": 20748,"Sequence number": 246573, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3339 } }, { "ph": "f", "id": 195, "pid": 1336754, "tid": 1381179, "ts": 1295651361949.075, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651361977.439, "dur": 72.210, "args": { "External id": 20749,"Record function id": 0, "Ev Idx": 3340 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651362058.601, "dur": 63.811, "args": { "External id": 20750,"Record function id": 0, "Ev Idx": 3341 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.16)", "pid": 1336754, "tid": 1381179, "ts": 1295651362128.267, "dur": 36978.715, "args": { "External id": 20751,"Record function id": 0, "Ev Idx": 3342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651362216.409, "dur": 10.195, "args": { "External id": 20752,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651362253.333, "dur": 5.193, "args": { "External id": 20753,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3344 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651362274.067, "dur": 35949.104, "args": { "External id": 20754,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651362290.325, "dur": 35924.678, "args": { "External id": 20755,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651362344.464, "dur": 15.008, "args": { "External id": 20756,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651362365.670, "dur": 35810.536, "args": { "External id": 20757,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651362368.211, "dur": 35807.527, "args": { "External id": 20758,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651362372.150, "dur": 6.041, "args": { "External id": 20759,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651362380.124, "dur": 35792.085, "args": { "External id": 20760,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651398324.639, "dur": 8.884, "args": { "External id": 20761,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651398327.634, "dur": 5.418, "args": { "External id": 20762,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651398360.515, "dur": 413.285, "args": { "External id": 20763,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651398390.082, "dur": 378.961, "args": { "External id": 20764,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3355, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651398400.551, "dur": 363.167, "args": { "External id": 20765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651398798.900, "dur": 2.708, "args": { "External id": 20766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3357, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398857.856, "dur": 6.495, "args": { "External id": 20767,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398912.852, "dur": 1.540, "args": { "External id": 20768,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398929.966, "dur": 1.466, "args": { "External id": 20769,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398943.384, "dur": 1.060, "args": { "External id": 20770,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398958.550, "dur": 1.237, "args": { "External id": 20771,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651398969.188, "dur": 1.537, "args": { "External id": 20772,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399015.138, "dur": 2.238, "args": { "External id": 20773,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399033.107, "dur": 1.714, "args": { "External id": 20774,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399043.661, "dur": 1.727, "args": { "External id": 20775,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3366 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651399139.029, "dur": 2625.267, "args": { "External id": 20776,"Record function id": 0, "Ev Idx": 3367 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651399158.962, "dur": 986.900, "args": { "External id": 20777,"Record function id": 0, "Ev Idx": 3368 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651399174.871, "dur": 322.659, "args": { "External id": 20778,"Record function id": 0, "Ev Idx": 3369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399265.846, "dur": 4.968, "args": { "External id": 20779,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399274.279, "dur": 1.249, "args": { "External id": 20780,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399279.392, "dur": 1.453, "args": { "External id": 20781,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399282.086, "dur": 1.436, "args": { "External id": 20782,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399284.948, "dur": 1.860, "args": { "External id": 20783,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399288.163, "dur": 1.854, "args": { "External id": 20784,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399293.580, "dur": 1.363, "args": { "External id": 20785,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399296.357, "dur": 1.397, "args": { "External id": 20786,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399299.417, "dur": 1.584, "args": { "External id": 20787,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651399302.460, "dur": 1.222, "args": { "External id": 20788,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3379 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651399326.012, "dur": 142.778, "args": { "External id": 20789,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651399341.522, "dur": 122.788, "args": { "External id": 20790,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651399357.125, "dur": 12.400, "args": { "External id": 20791,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651399372.522, "dur": 63.580, "args": { "External id": 20792,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651399374.752, "dur": 61.026, "args": { "External id": 20793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399377.944, "dur": 5.105, "args": { "External id": 20794,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651399384.579, "dur": 50.775, "args": { "External id": 20795,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3386 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.14", "pid": 1336754, "tid": 1381179, "ts": 1295651399575.442, "dur": 562.744, "args": { "External id": 20796,"Record function id": 0, "Ev Idx": 3387 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651399591.428, "dur": 534.674, "args": { "External id": 20797,"Record function id": 0, "Ev Idx": 3388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651399643.667, "dur": 4.571, "args": { "External id": 20798,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651399663.311, "dur": 26.704, "args": { "External id": 20799,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399667.962, "dur": 1.717, "args": { "External id": 20800,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399671.060, "dur": 0.336, "args": { "External id": 20801,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399673.146, "dur": 0.303, "args": { "External id": 20802,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399674.899, "dur": 0.199, "args": { "External id": 20803,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399677.076, "dur": 0.500, "args": { "External id": 20804,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399678.971, "dur": 0.534, "args": { "External id": 20805,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399680.891, "dur": 0.922, "args": { "External id": 20806,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399683.338, "dur": 0.454, "args": { "External id": 20807,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399684.658, "dur": 1.032, "args": { "External id": 20808,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651399699.067, "dur": 31.133, "args": { "External id": 20809,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3400 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651399759.414, "dur": 96.445, "args": { "External id": 20810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651399768.193, "dur": 3.462, "args": { "External id": 20811,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651399776.193, "dur": 11.132, "args": { "External id": 20812,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651399780.126, "dur": 6.795, "args": { "External id": 20813,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399783.535, "dur": 1.328, "args": { "External id": 20814,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651399794.349, "dur": 26.457, "args": { "External id": 20815,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399795.862, "dur": 0.807, "args": { "External id": 20816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399798.436, "dur": 0.521, "args": { "External id": 20817,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399799.825, "dur": 1.037, "args": { "External id": 20818,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399802.069, "dur": 0.800, "args": { "External id": 20819,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399804.904, "dur": 0.436, "args": { "External id": 20820,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399806.630, "dur": 0.663, "args": { "External id": 20821,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399808.547, "dur": 0.459, "args": { "External id": 20822,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399810.198, "dur": 0.604, "args": { "External id": 20823,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651399812.125, "dur": 0.554, "args": { "External id": 20824,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651399829.639, "dur": 19.532, "args": { "External id": 20825,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3416 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651399896.070, "dur": 155.963, "args": { "External id": 20826,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3417 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651399922.510, "dur": 125.761, "args": { "External id": 20827,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3418, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651399930.928, "dur": 112.521, "args": { "External id": 20828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3419 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651400070.798, "dur": 2.463, "args": { "External id": 20829,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3420, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651400153.011, "dur": 1593.604, "args": { "External id": 20830,"Sequence number": 246572, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3421 } }, { "ph": "f", "id": 196, "pid": 1336754, "tid": 1381179, "ts": 1295651400153.011, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400273.531, "dur": 106.819, "args": { "External id": 20831,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3422 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651400419.954, "dur": 38.291, "args": { "External id": 20832,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651400473.942, "dur": 52.769, "args": { "External id": 20833,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400536.591, "dur": 36.601, "args": { "External id": 20834,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400579.912, "dur": 44.665, "args": { "External id": 20835,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400631.692, "dur": 28.353, "args": { "External id": 20836,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400666.822, "dur": 41.036, "args": { "External id": 20837,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3428 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651400731.730, "dur": 23.527, "args": { "External id": 20838,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3429 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651400773.213, "dur": 30.168, "args": { "External id": 20839,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3430 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651400825.311, "dur": 20.692, "args": { "External id": 20840,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3431 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651400858.224, "dur": 17.406, "args": { "External id": 20841,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400884.189, "dur": 30.977, "args": { "External id": 20842,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651400918.130, "dur": 33.100, "args": { "External id": 20843,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3434 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651400981.202, "dur": 205.129, "args": { "External id": 20844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651401094.855, "dur": 6.796, "args": { "External id": 20845,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651401103.533, "dur": 2.459, "args": { "External id": 20846,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3437 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651401216.550, "dur": 42.868, "args": { "External id": 20847,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3438 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651401272.654, "dur": 16.173, "args": { "External id": 20848,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401299.183, "dur": 43.077, "args": { "External id": 20849,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401348.341, "dur": 35.706, "args": { "External id": 20850,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401390.159, "dur": 21.959, "args": { "External id": 20851,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401416.478, "dur": 29.079, "args": { "External id": 20852,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401451.628, "dur": 21.236, "args": { "External id": 20853,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651401479.287, "dur": 28.274, "args": { "External id": 20854,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3445 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651401533.956, "dur": 30.494, "args": { "External id": 20855,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3446 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651401589.898, "dur": 28.518, "args": { "External id": 20856,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3447 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651401633.379, "dur": 17.784, "args": { "External id": 20857,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3448 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651401666.772, "dur": 19.651, "args": { "External id": 20858,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3449 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651401700.179, "dur": 16.579, "args": { "External id": 20859,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3450 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401786.091, "dur": 17.913, "args": { "External id": 20860,"Record function id": 0, "Ev Idx": 3451 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401792.010, "dur": 11.158, "args": { "External id": 20861,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401796.042, "dur": 6.332, "args": { "External id": 20862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3453 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401797.671, "dur": 4.605, "args": { "External id": 20863,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3454 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401808.049, "dur": 4.978, "args": { "External id": 20864,"Record function id": 0, "Ev Idx": 3455 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401809.494, "dur": 3.088, "args": { "External id": 20865,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401810.334, "dur": 1.701, "args": { "External id": 20866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3457 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401810.934, "dur": 1.035, "args": { "External id": 20867,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3458 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401816.519, "dur": 4.548, "args": { "External id": 20868,"Record function id": 0, "Ev Idx": 3459 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401817.751, "dur": 2.880, "args": { "External id": 20869,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401818.519, "dur": 1.634, "args": { "External id": 20870,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3461 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401819.191, "dur": 0.895, "args": { "External id": 20871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3462 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401824.395, "dur": 3.799, "args": { "External id": 20872,"Record function id": 0, "Ev Idx": 3463 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401825.432, "dur": 2.351, "args": { "External id": 20873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401825.971, "dur": 1.383, "args": { "External id": 20874,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3465 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401826.671, "dur": 0.607, "args": { "External id": 20875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3466 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401831.355, "dur": 4.134, "args": { "External id": 20876,"Record function id": 0, "Ev Idx": 3467 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401832.603, "dur": 2.459, "args": { "External id": 20877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401833.235, "dur": 1.407, "args": { "External id": 20878,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3469 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401833.876, "dur": 0.701, "args": { "External id": 20879,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3470 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401838.757, "dur": 4.541, "args": { "External id": 20880,"Record function id": 0, "Ev Idx": 3471 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401839.707, "dur": 3.155, "args": { "External id": 20881,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401840.647, "dur": 1.761, "args": { "External id": 20882,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3473 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401841.193, "dur": 1.147, "args": { "External id": 20883,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3474 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401846.664, "dur": 7.313, "args": { "External id": 20884,"Record function id": 0, "Ev Idx": 3475 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401851.111, "dur": 2.413, "args": { "External id": 20885,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401851.773, "dur": 1.280, "args": { "External id": 20886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3477 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401852.168, "dur": 0.803, "args": { "External id": 20887,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3478 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401857.110, "dur": 3.323, "args": { "External id": 20888,"Record function id": 0, "Ev Idx": 3479 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401857.979, "dur": 2.028, "args": { "External id": 20889,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401858.432, "dur": 1.127, "args": { "External id": 20890,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3481 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401858.706, "dur": 0.763, "args": { "External id": 20891,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3482 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401863.544, "dur": 3.851, "args": { "External id": 20892,"Record function id": 0, "Ev Idx": 3483 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651401864.787, "dur": 2.148, "args": { "External id": 20893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401865.230, "dur": 1.194, "args": { "External id": 20894,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3485 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651401865.486, "dur": 0.878, "args": { "External id": 20895,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3486 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651401871.035, "dur": 36672.950, "args": { "External id": 20896,"Record function id": 0, "Sequence number": 246571, "Fwd thread id": 1, "Ev Idx": 3487 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651401872.202, "dur": 36663.264, "args": { "External id": 20897,"Sequence number": 246571, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3488 } }, { "ph": "f", "id": 197, "pid": 1336754, "tid": 1381179, "ts": 1295651401872.202, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651401900.575, "dur": 39.768, "args": { "External id": 20898,"Record function id": 0, "Ev Idx": 3489 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651401948.125, "dur": 107.636, "args": { "External id": 20899,"Record function id": 0, "Ev Idx": 3490 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.15)", "pid": 1336754, "tid": 1381179, "ts": 1295651402063.797, "dur": 36463.847, "args": { "External id": 20900,"Record function id": 0, "Ev Idx": 3491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651402158.509, "dur": 7.626, "args": { "External id": 20901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651402175.833, "dur": 5.002, "args": { "External id": 20902,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3493 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651402196.692, "dur": 35493.549, "args": { "External id": 20903,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651402209.345, "dur": 35470.843, "args": { "External id": 20904,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651402272.039, "dur": 16.287, "args": { "External id": 20905,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651402294.468, "dur": 35340.217, "args": { "External id": 20906,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651402296.904, "dur": 35337.232, "args": { "External id": 20907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651402300.534, "dur": 5.992, "args": { "External id": 20908,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651402308.048, "dur": 35322.198, "args": { "External id": 20909,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651437785.642, "dur": 9.867, "args": { "External id": 20910,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651437789.115, "dur": 6.013, "args": { "External id": 20911,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651437824.689, "dur": 394.518, "args": { "External id": 20912,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651437856.070, "dur": 358.037, "args": { "External id": 20913,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3504, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651437867.391, "dur": 340.286, "args": { "External id": 20914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651438258.192, "dur": 3.346, "args": { "External id": 20915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3506, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438328.079, "dur": 6.916, "args": { "External id": 20916,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438378.962, "dur": 1.716, "args": { "External id": 20917,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438395.398, "dur": 1.620, "args": { "External id": 20918,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438409.734, "dur": 1.307, "args": { "External id": 20919,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438421.384, "dur": 0.869, "args": { "External id": 20920,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438431.674, "dur": 1.166, "args": { "External id": 20921,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438442.444, "dur": 1.280, "args": { "External id": 20922,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438454.113, "dur": 2.119, "args": { "External id": 20923,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438465.637, "dur": 1.917, "args": { "External id": 20924,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3515 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651438559.712, "dur": 2741.488, "args": { "External id": 20925,"Record function id": 0, "Ev Idx": 3516 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651438578.314, "dur": 996.248, "args": { "External id": 20926,"Record function id": 0, "Ev Idx": 3517 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651438594.100, "dur": 297.741, "args": { "External id": 20927,"Record function id": 0, "Ev Idx": 3518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438666.506, "dur": 4.175, "args": { "External id": 20928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438674.078, "dur": 1.261, "args": { "External id": 20929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438677.318, "dur": 1.254, "args": { "External id": 20930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438682.426, "dur": 1.387, "args": { "External id": 20931,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438685.352, "dur": 1.009, "args": { "External id": 20932,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438687.784, "dur": 0.987, "args": { "External id": 20933,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438690.040, "dur": 0.864, "args": { "External id": 20934,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438694.511, "dur": 0.980, "args": { "External id": 20935,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438697.112, "dur": 1.223, "args": { "External id": 20936,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651438699.804, "dur": 0.836, "args": { "External id": 20937,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3528 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651438717.729, "dur": 147.853, "args": { "External id": 20938,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651438734.484, "dur": 126.684, "args": { "External id": 20939,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651438751.808, "dur": 12.276, "args": { "External id": 20940,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651438766.725, "dur": 66.792, "args": { "External id": 20941,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651438769.152, "dur": 64.051, "args": { "External id": 20942,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651438772.916, "dur": 5.014, "args": { "External id": 20943,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651438779.653, "dur": 52.882, "args": { "External id": 20944,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3535 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.13", "pid": 1336754, "tid": 1381179, "ts": 1295651438966.390, "dur": 600.376, "args": { "External id": 20945,"Record function id": 0, "Ev Idx": 3536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651439022.390, "dur": 532.450, "args": { "External id": 20946,"Record function id": 0, "Ev Idx": 3537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651439080.626, "dur": 6.791, "args": { "External id": 20947,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651439103.587, "dur": 26.865, "args": { "External id": 20948,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439108.374, "dur": 1.549, "args": { "External id": 20949,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439112.061, "dur": 0.270, "args": { "External id": 20950,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439113.600, "dur": 0.260, "args": { "External id": 20951,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439115.247, "dur": 0.800, "args": { "External id": 20952,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439117.232, "dur": 0.687, "args": { "External id": 20953,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439119.147, "dur": 0.489, "args": { "External id": 20954,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439121.035, "dur": 0.832, "args": { "External id": 20955,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439123.479, "dur": 0.696, "args": { "External id": 20956,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439125.513, "dur": 0.527, "args": { "External id": 20957,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651439139.992, "dur": 35.020, "args": { "External id": 20958,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3549 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651439205.036, "dur": 123.334, "args": { "External id": 20959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651439214.188, "dur": 3.433, "args": { "External id": 20960,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651439224.958, "dur": 27.027, "args": { "External id": 20961,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651439244.578, "dur": 6.959, "args": { "External id": 20962,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439248.009, "dur": 1.354, "args": { "External id": 20963,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651439263.304, "dur": 24.678, "args": { "External id": 20964,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439265.145, "dur": 0.663, "args": { "External id": 20965,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439267.352, "dur": 0.733, "args": { "External id": 20966,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439269.072, "dur": 0.902, "args": { "External id": 20967,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439271.446, "dur": 0.709, "args": { "External id": 20968,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439273.608, "dur": 1.147, "args": { "External id": 20969,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439275.780, "dur": 0.629, "args": { "External id": 20970,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439277.479, "dur": 0.583, "args": { "External id": 20971,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439278.771, "dur": 0.542, "args": { "External id": 20972,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651439280.268, "dur": 0.684, "args": { "External id": 20973,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651439298.433, "dur": 22.102, "args": { "External id": 20974,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3565 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651439373.019, "dur": 114.231, "args": { "External id": 20975,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3566 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651439399.143, "dur": 84.983, "args": { "External id": 20976,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3567, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651439408.356, "dur": 71.557, "args": { "External id": 20977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3568 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651439503.112, "dur": 2.194, "args": { "External id": 20978,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3569, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651439582.574, "dur": 1698.982, "args": { "External id": 20979,"Sequence number": 246570, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3570 } }, { "ph": "f", "id": 198, "pid": 1336754, "tid": 1381179, "ts": 1295651439582.574, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651439686.887, "dur": 102.637, "args": { "External id": 20980,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3571 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651439828.033, "dur": 42.334, "args": { "External id": 20981,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651439885.699, "dur": 52.347, "args": { "External id": 20982,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651439947.983, "dur": 71.283, "args": { "External id": 20983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440030.962, "dur": 49.954, "args": { "External id": 20984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440088.912, "dur": 28.218, "args": { "External id": 20985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440124.546, "dur": 41.828, "args": { "External id": 20986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3577 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651440192.680, "dur": 24.175, "args": { "External id": 20987,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3578 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651440252.157, "dur": 32.239, "args": { "External id": 20988,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3579 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651440306.443, "dur": 21.097, "args": { "External id": 20989,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3580 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651440339.857, "dur": 16.399, "args": { "External id": 20990,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440365.310, "dur": 34.672, "args": { "External id": 20991,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440403.454, "dur": 33.240, "args": { "External id": 20992,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3583 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651440486.670, "dur": 167.628, "args": { "External id": 20993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651440565.890, "dur": 5.625, "args": { "External id": 20994,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651440573.255, "dur": 2.383, "args": { "External id": 20995,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3586 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651440683.623, "dur": 27.308, "args": { "External id": 20996,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3587 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651440721.682, "dur": 14.936, "args": { "External id": 20997,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440747.551, "dur": 37.578, "args": { "External id": 20998,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440792.309, "dur": 39.328, "args": { "External id": 20999,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440838.810, "dur": 24.601, "args": { "External id": 21000,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440867.886, "dur": 28.957, "args": { "External id": 21001,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440902.389, "dur": 21.131, "args": { "External id": 21002,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651440930.081, "dur": 28.874, "args": { "External id": 21003,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3594 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651441017.540, "dur": 32.888, "args": { "External id": 21004,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3595 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651441096.642, "dur": 32.253, "args": { "External id": 21005,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3596 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651441149.577, "dur": 18.816, "args": { "External id": 21006,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3597 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651441186.011, "dur": 15.274, "args": { "External id": 21007,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3598 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651441216.881, "dur": 30.946, "args": { "External id": 21008,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3599 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441327.051, "dur": 14.636, "args": { "External id": 21009,"Record function id": 0, "Ev Idx": 3600 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441330.035, "dur": 10.752, "args": { "External id": 21010,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441333.888, "dur": 6.089, "args": { "External id": 21011,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3602 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441335.542, "dur": 4.326, "args": { "External id": 21012,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3603 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441345.685, "dur": 4.840, "args": { "External id": 21013,"Record function id": 0, "Ev Idx": 3604 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441346.988, "dur": 3.119, "args": { "External id": 21014,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441347.800, "dur": 1.774, "args": { "External id": 21015,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3606 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441348.451, "dur": 1.011, "args": { "External id": 21016,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3607 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441353.784, "dur": 4.501, "args": { "External id": 21017,"Record function id": 0, "Ev Idx": 3608 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441355.181, "dur": 2.652, "args": { "External id": 21018,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441355.792, "dur": 1.623, "args": { "External id": 21019,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3610 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441356.483, "dur": 0.743, "args": { "External id": 21020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3611 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441361.518, "dur": 3.594, "args": { "External id": 21021,"Record function id": 0, "Ev Idx": 3612 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441362.455, "dur": 2.226, "args": { "External id": 21022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441363.117, "dur": 1.134, "args": { "External id": 21023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3614 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441363.395, "dur": 0.780, "args": { "External id": 21024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3615 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441368.213, "dur": 4.140, "args": { "External id": 21025,"Record function id": 0, "Ev Idx": 3616 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441369.468, "dur": 2.458, "args": { "External id": 21026,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441369.951, "dur": 1.525, "args": { "External id": 21027,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3618 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441370.533, "dur": 0.876, "args": { "External id": 21028,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3619 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441375.393, "dur": 6.254, "args": { "External id": 21029,"Record function id": 0, "Ev Idx": 3620 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441379.312, "dur": 1.927, "args": { "External id": 21030,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441379.770, "dur": 1.046, "args": { "External id": 21031,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3622 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441380.179, "dur": 0.573, "args": { "External id": 21032,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3623 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441384.798, "dur": 3.423, "args": { "External id": 21033,"Record function id": 0, "Ev Idx": 3624 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441385.911, "dur": 1.901, "args": { "External id": 21034,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441386.339, "dur": 1.009, "args": { "External id": 21035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3626 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441386.611, "dur": 0.672, "args": { "External id": 21036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3627 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441391.479, "dur": 5.865, "args": { "External id": 21037,"Record function id": 0, "Ev Idx": 3628 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441392.639, "dur": 4.315, "args": { "External id": 21038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441393.240, "dur": 3.275, "args": { "External id": 21039,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3630 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441395.531, "dur": 0.883, "args": { "External id": 21040,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3631 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441400.406, "dur": 3.485, "args": { "External id": 21041,"Record function id": 0, "Ev Idx": 3632 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651441401.362, "dur": 2.102, "args": { "External id": 21042,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441401.806, "dur": 1.233, "args": { "External id": 21043,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3634 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651441402.075, "dur": 0.883, "args": { "External id": 21044,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3635 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651441407.678, "dur": 36769.436, "args": { "External id": 21045,"Record function id": 0, "Sequence number": 246569, "Fwd thread id": 1, "Ev Idx": 3636 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651441408.890, "dur": 36759.764, "args": { "External id": 21046,"Sequence number": 246569, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3637 } }, { "ph": "f", "id": 199, "pid": 1336754, "tid": 1381179, "ts": 1295651441408.890, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651441437.883, "dur": 37.984, "args": { "External id": 21047,"Record function id": 0, "Ev Idx": 3638 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651441483.250, "dur": 61.601, "args": { "External id": 21048,"Record function id": 0, "Ev Idx": 3639 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.14)", "pid": 1336754, "tid": 1381179, "ts": 1295651441550.763, "dur": 36609.717, "args": { "External id": 21049,"Record function id": 0, "Ev Idx": 3640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651441636.067, "dur": 6.845, "args": { "External id": 21050,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651441651.862, "dur": 4.516, "args": { "External id": 21051,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3642 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651441671.116, "dur": 35691.252, "args": { "External id": 21052,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651441686.787, "dur": 35667.037, "args": { "External id": 21053,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651441728.873, "dur": 14.276, "args": { "External id": 21054,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651441749.249, "dur": 35566.706, "args": { "External id": 21055,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651441751.697, "dur": 35563.672, "args": { "External id": 21056,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651441754.999, "dur": 5.252, "args": { "External id": 21057,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651441762.050, "dur": 35549.772, "args": { "External id": 21058,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651477455.730, "dur": 8.574, "args": { "External id": 21059,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651477458.498, "dur": 5.467, "args": { "External id": 21060,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3651 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651477491.815, "dur": 344.610, "args": { "External id": 21061,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3652 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651477525.002, "dur": 307.034, "args": { "External id": 21062,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3653, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651477536.348, "dur": 290.363, "args": { "External id": 21063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3654 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651477854.855, "dur": 2.091, "args": { "External id": 21064,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3655, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651477910.245, "dur": 6.638, "args": { "External id": 21065,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651477960.039, "dur": 1.906, "args": { "External id": 21066,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651477977.139, "dur": 1.336, "args": { "External id": 21067,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478041.600, "dur": 1.645, "args": { "External id": 21068,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478054.669, "dur": 0.993, "args": { "External id": 21069,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478064.658, "dur": 1.122, "args": { "External id": 21070,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478075.645, "dur": 1.152, "args": { "External id": 21071,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478087.960, "dur": 1.676, "args": { "External id": 21072,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478101.354, "dur": 0.979, "args": { "External id": 21073,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3664 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651478192.393, "dur": 2639.734, "args": { "External id": 21074,"Record function id": 0, "Ev Idx": 3665 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651478211.347, "dur": 989.925, "args": { "External id": 21075,"Record function id": 0, "Ev Idx": 3666 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651478224.623, "dur": 323.866, "args": { "External id": 21076,"Record function id": 0, "Ev Idx": 3667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478317.640, "dur": 5.190, "args": { "External id": 21077,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478326.207, "dur": 1.092, "args": { "External id": 21078,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478329.064, "dur": 1.186, "args": { "External id": 21079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478331.900, "dur": 1.336, "args": { "External id": 21080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478334.731, "dur": 1.239, "args": { "External id": 21081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478337.278, "dur": 1.267, "args": { "External id": 21082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478342.516, "dur": 1.189, "args": { "External id": 21083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478345.033, "dur": 1.337, "args": { "External id": 21084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478347.683, "dur": 1.222, "args": { "External id": 21085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651478350.306, "dur": 1.510, "args": { "External id": 21086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3677 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651478371.295, "dur": 148.462, "args": { "External id": 21087,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651478389.521, "dur": 125.437, "args": { "External id": 21088,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651478405.173, "dur": 12.353, "args": { "External id": 21089,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651478420.532, "dur": 66.652, "args": { "External id": 21090,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651478423.147, "dur": 63.698, "args": { "External id": 21091,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478426.737, "dur": 5.819, "args": { "External id": 21092,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651478434.342, "dur": 51.851, "args": { "External id": 21093,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3684 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.12", "pid": 1336754, "tid": 1381179, "ts": 1295651478623.761, "dur": 570.274, "args": { "External id": 21094,"Record function id": 0, "Ev Idx": 3685 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651478638.658, "dur": 543.178, "args": { "External id": 21095,"Record function id": 0, "Ev Idx": 3686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651478695.791, "dur": 4.342, "args": { "External id": 21096,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651478715.729, "dur": 23.927, "args": { "External id": 21097,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478720.918, "dur": 1.417, "args": { "External id": 21098,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478724.208, "dur": 0.526, "args": { "External id": 21099,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478726.086, "dur": 0.406, "args": { "External id": 21100,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478727.384, "dur": 0.184, "args": { "External id": 21101,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478728.946, "dur": 0.494, "args": { "External id": 21102,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478730.540, "dur": 0.712, "args": { "External id": 21103,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478732.428, "dur": 0.663, "args": { "External id": 21104,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478734.340, "dur": 0.970, "args": { "External id": 21105,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478736.239, "dur": 0.516, "args": { "External id": 21106,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651478749.754, "dur": 28.469, "args": { "External id": 21107,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3698 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651478807.852, "dur": 93.827, "args": { "External id": 21108,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651478817.178, "dur": 3.308, "args": { "External id": 21109,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651478825.567, "dur": 9.689, "args": { "External id": 21110,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651478829.256, "dur": 5.560, "args": { "External id": 21111,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478832.380, "dur": 0.602, "args": { "External id": 21112,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651478841.955, "dur": 24.243, "args": { "External id": 21113,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478843.436, "dur": 1.045, "args": { "External id": 21114,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478845.796, "dur": 0.571, "args": { "External id": 21115,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478847.865, "dur": 0.651, "args": { "External id": 21116,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478849.875, "dur": 0.509, "args": { "External id": 21117,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478851.553, "dur": 0.734, "args": { "External id": 21118,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478853.525, "dur": 0.469, "args": { "External id": 21119,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478855.358, "dur": 0.446, "args": { "External id": 21120,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478856.796, "dur": 0.800, "args": { "External id": 21121,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651478859.074, "dur": 0.442, "args": { "External id": 21122,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651478876.550, "dur": 18.249, "args": { "External id": 21123,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3714 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651478946.447, "dur": 154.801, "args": { "External id": 21124,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3715 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651478970.649, "dur": 126.769, "args": { "External id": 21125,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3716, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651478979.481, "dur": 111.513, "args": { "External id": 21126,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3717 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651479122.055, "dur": 2.161, "args": { "External id": 21127,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3718, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651479207.943, "dur": 1604.798, "args": { "External id": 21128,"Sequence number": 246568, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3719 } }, { "ph": "f", "id": 200, "pid": 1336754, "tid": 1381179, "ts": 1295651479207.943, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479333.921, "dur": 104.232, "args": { "External id": 21129,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651479476.166, "dur": 37.431, "args": { "External id": 21130,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651479528.739, "dur": 47.744, "args": { "External id": 21131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479585.802, "dur": 32.119, "args": { "External id": 21132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479625.309, "dur": 43.639, "args": { "External id": 21133,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479675.868, "dur": 27.762, "args": { "External id": 21134,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479710.794, "dur": 40.670, "args": { "External id": 21135,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3726 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651479775.805, "dur": 21.959, "args": { "External id": 21136,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3727 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651479815.943, "dur": 27.300, "args": { "External id": 21137,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3728 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651479863.600, "dur": 20.859, "args": { "External id": 21138,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3729 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651479894.556, "dur": 16.785, "args": { "External id": 21139,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479920.501, "dur": 29.551, "args": { "External id": 21140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651479953.231, "dur": 71.052, "args": { "External id": 21141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3732 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651480054.788, "dur": 196.989, "args": { "External id": 21142,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651480137.696, "dur": 6.570, "args": { "External id": 21143,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651480146.298, "dur": 2.738, "args": { "External id": 21144,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3735 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651480284.441, "dur": 32.564, "args": { "External id": 21145,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3736 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651480330.961, "dur": 18.315, "args": { "External id": 21146,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480358.035, "dur": 42.449, "args": { "External id": 21147,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480409.867, "dur": 34.253, "args": { "External id": 21148,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480451.260, "dur": 24.936, "args": { "External id": 21149,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480480.443, "dur": 29.984, "args": { "External id": 21150,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480516.454, "dur": 24.552, "args": { "External id": 21151,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651480547.690, "dur": 28.778, "args": { "External id": 21152,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3743 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651480598.287, "dur": 23.184, "args": { "External id": 21153,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3744 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651480649.570, "dur": 31.472, "args": { "External id": 21154,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3745 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651480701.713, "dur": 18.119, "args": { "External id": 21155,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3746 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651480737.760, "dur": 18.253, "args": { "External id": 21156,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3747 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651480768.015, "dur": 15.622, "args": { "External id": 21157,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3748 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480853.710, "dur": 14.611, "args": { "External id": 21158,"Record function id": 0, "Ev Idx": 3749 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480856.617, "dur": 10.747, "args": { "External id": 21159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480860.727, "dur": 5.747, "args": { "External id": 21160,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3751 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480862.126, "dur": 4.230, "args": { "External id": 21161,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3752 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480872.224, "dur": 4.063, "args": { "External id": 21162,"Record function id": 0, "Ev Idx": 3753 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480873.487, "dur": 2.355, "args": { "External id": 21163,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480874.167, "dur": 1.220, "args": { "External id": 21164,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3755 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480874.612, "dur": 0.701, "args": { "External id": 21165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3756 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480879.557, "dur": 4.443, "args": { "External id": 21166,"Record function id": 0, "Ev Idx": 3757 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480880.586, "dur": 3.006, "args": { "External id": 21167,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480881.227, "dur": 1.961, "args": { "External id": 21168,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3759 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480882.093, "dur": 0.980, "args": { "External id": 21169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3760 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480887.219, "dur": 4.072, "args": { "External id": 21170,"Record function id": 0, "Ev Idx": 3761 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480888.786, "dur": 2.095, "args": { "External id": 21171,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480889.379, "dur": 1.011, "args": { "External id": 21172,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3763 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480889.668, "dur": 0.656, "args": { "External id": 21173,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3764 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480894.464, "dur": 4.002, "args": { "External id": 21174,"Record function id": 0, "Ev Idx": 3765 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480895.714, "dur": 2.343, "args": { "External id": 21175,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480896.167, "dur": 1.429, "args": { "External id": 21176,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3767 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480896.572, "dur": 0.956, "args": { "External id": 21177,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3768 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480901.599, "dur": 3.415, "args": { "External id": 21178,"Record function id": 0, "Ev Idx": 3769 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480902.629, "dur": 1.985, "args": { "External id": 21179,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480903.086, "dur": 1.101, "args": { "External id": 21180,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3771 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480903.421, "dur": 0.700, "args": { "External id": 21181,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3772 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480908.279, "dur": 5.207, "args": { "External id": 21182,"Record function id": 0, "Ev Idx": 3773 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480909.132, "dur": 3.917, "args": { "External id": 21183,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480909.612, "dur": 2.984, "args": { "External id": 21184,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3775 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480911.811, "dur": 0.720, "args": { "External id": 21185,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3776 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480916.653, "dur": 3.828, "args": { "External id": 21186,"Record function id": 0, "Ev Idx": 3777 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480917.739, "dur": 2.305, "args": { "External id": 21187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480918.445, "dur": 1.180, "args": { "External id": 21188,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3779 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480918.860, "dur": 0.698, "args": { "External id": 21189,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3780 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480923.584, "dur": 3.771, "args": { "External id": 21190,"Record function id": 0, "Ev Idx": 3781 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651480924.669, "dur": 2.269, "args": { "External id": 21191,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480925.108, "dur": 1.409, "args": { "External id": 21192,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3783 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651480925.546, "dur": 0.903, "args": { "External id": 21193,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3784 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651480931.592, "dur": 38139.577, "args": { "External id": 21194,"Record function id": 0, "Sequence number": 246567, "Fwd thread id": 1, "Ev Idx": 3785 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651480932.712, "dur": 38129.052, "args": { "External id": 21195,"Sequence number": 246567, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3786 } }, { "ph": "f", "id": 201, "pid": 1336754, "tid": 1381179, "ts": 1295651480932.712, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651480960.806, "dur": 73.738, "args": { "External id": 21196,"Record function id": 0, "Ev Idx": 3787 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651481043.937, "dur": 65.617, "args": { "External id": 21197,"Record function id": 0, "Ev Idx": 3788 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.13)", "pid": 1336754, "tid": 1381179, "ts": 1295651481118.047, "dur": 37935.619, "args": { "External id": 21198,"Record function id": 0, "Ev Idx": 3789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651481203.394, "dur": 7.154, "args": { "External id": 21199,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651481220.793, "dur": 5.042, "args": { "External id": 21200,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3791 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651481256.533, "dur": 36920.189, "args": { "External id": 21201,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651481270.489, "dur": 36897.427, "args": { "External id": 21202,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651481312.383, "dur": 15.079, "args": { "External id": 21203,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651481333.797, "dur": 36793.980, "args": { "External id": 21204,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651481336.601, "dur": 36790.584, "args": { "External id": 21205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651481340.363, "dur": 6.297, "args": { "External id": 21206,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651481348.238, "dur": 36775.489, "args": { "External id": 21207,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651518288.192, "dur": 11.788, "args": { "External id": 21208,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651518290.892, "dur": 8.574, "args": { "External id": 21209,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3800 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651518327.271, "dur": 404.978, "args": { "External id": 21210,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3801 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651518356.999, "dur": 370.233, "args": { "External id": 21211,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3802, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651518367.953, "dur": 352.492, "args": { "External id": 21212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3803 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651518755.971, "dur": 2.222, "args": { "External id": 21213,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3804, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518818.656, "dur": 6.623, "args": { "External id": 21214,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518870.211, "dur": 1.743, "args": { "External id": 21215,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518887.541, "dur": 1.353, "args": { "External id": 21216,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518900.061, "dur": 1.191, "args": { "External id": 21217,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518911.742, "dur": 1.264, "args": { "External id": 21218,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518922.108, "dur": 1.257, "args": { "External id": 21219,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518933.698, "dur": 0.903, "args": { "External id": 21220,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518945.690, "dur": 1.158, "args": { "External id": 21221,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651518958.822, "dur": 1.019, "args": { "External id": 21222,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3813 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651519087.002, "dur": 2632.852, "args": { "External id": 21223,"Record function id": 0, "Ev Idx": 3814 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651519106.689, "dur": 977.879, "args": { "External id": 21224,"Record function id": 0, "Ev Idx": 3815 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651519121.221, "dur": 323.422, "args": { "External id": 21225,"Record function id": 0, "Ev Idx": 3816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519196.628, "dur": 5.076, "args": { "External id": 21226,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519205.248, "dur": 1.266, "args": { "External id": 21227,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519208.493, "dur": 0.998, "args": { "External id": 21228,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519211.486, "dur": 1.280, "args": { "External id": 21229,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519214.134, "dur": 1.269, "args": { "External id": 21230,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519216.710, "dur": 1.509, "args": { "External id": 21231,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519221.836, "dur": 1.473, "args": { "External id": 21232,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519224.727, "dur": 1.074, "args": { "External id": 21233,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519227.056, "dur": 15.970, "args": { "External id": 21234,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651519246.849, "dur": 2.318, "args": { "External id": 21235,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3826 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651519269.064, "dur": 147.465, "args": { "External id": 21236,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651519284.734, "dur": 127.262, "args": { "External id": 21237,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651519300.535, "dur": 12.228, "args": { "External id": 21238,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651519315.485, "dur": 68.108, "args": { "External id": 21239,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651519318.001, "dur": 65.206, "args": { "External id": 21240,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519322.298, "dur": 6.227, "args": { "External id": 21241,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651519330.433, "dur": 52.088, "args": { "External id": 21242,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3833 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.11", "pid": 1336754, "tid": 1381179, "ts": 1295651519523.627, "dur": 553.912, "args": { "External id": 21243,"Record function id": 0, "Ev Idx": 3834 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651519539.529, "dur": 524.332, "args": { "External id": 21244,"Record function id": 0, "Ev Idx": 3835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651519592.921, "dur": 4.285, "args": { "External id": 21245,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651519613.176, "dur": 24.268, "args": { "External id": 21246,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519617.790, "dur": 1.376, "args": { "External id": 21247,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519621.224, "dur": 0.270, "args": { "External id": 21248,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519623.243, "dur": 0.241, "args": { "External id": 21249,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519624.420, "dur": 1.523, "args": { "External id": 21250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519627.146, "dur": 0.622, "args": { "External id": 21251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519629.197, "dur": 0.624, "args": { "External id": 21252,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519630.650, "dur": 0.556, "args": { "External id": 21253,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519632.080, "dur": 0.774, "args": { "External id": 21254,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519634.202, "dur": 0.288, "args": { "External id": 21255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651519645.989, "dur": 31.202, "args": { "External id": 21256,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651519706.206, "dur": 88.709, "args": { "External id": 21257,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651519714.822, "dur": 3.093, "args": { "External id": 21258,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651519722.520, "dur": 9.821, "args": { "External id": 21259,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651519726.518, "dur": 5.392, "args": { "External id": 21260,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 3851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519729.964, "dur": 0.339, "args": { "External id": 21261,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651519738.593, "dur": 23.052, "args": { "External id": 21262,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519740.097, "dur": 0.576, "args": { "External id": 21263,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519742.037, "dur": 0.287, "args": { "External id": 21264,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519743.795, "dur": 0.547, "args": { "External id": 21265,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519745.482, "dur": 0.619, "args": { "External id": 21266,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519747.266, "dur": 0.463, "args": { "External id": 21267,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519748.917, "dur": 1.045, "args": { "External id": 21268,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519750.931, "dur": 0.992, "args": { "External id": 21269,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519753.018, "dur": 0.419, "args": { "External id": 21270,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651519754.713, "dur": 0.281, "args": { "External id": 21271,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651519770.130, "dur": 18.343, "args": { "External id": 21272,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3863 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651519840.389, "dur": 110.563, "args": { "External id": 21273,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 3864 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651519863.862, "dur": 84.121, "args": { "External id": 21274,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3865, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651519871.714, "dur": 72.206, "args": { "External id": 21275,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 3866 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651519966.544, "dur": 1.756, "args": { "External id": 21276,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3867, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651520092.213, "dur": 1608.046, "args": { "External id": 21277,"Sequence number": 246566, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3868 } }, { "ph": "f", "id": 202, "pid": 1336754, "tid": 1381179, "ts": 1295651520092.213, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520199.094, "dur": 120.518, "args": { "External id": 21278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 3869 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651520361.922, "dur": 41.709, "args": { "External id": 21279,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 3870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651520419.120, "dur": 51.765, "args": { "External id": 21280,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 3871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520481.633, "dur": 33.880, "args": { "External id": 21281,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520521.541, "dur": 44.169, "args": { "External id": 21282,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520572.684, "dur": 27.835, "args": { "External id": 21283,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 3874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520607.723, "dur": 41.467, "args": { "External id": 21284,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 3875 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651520675.711, "dur": 23.020, "args": { "External id": 21285,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 3876 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651520718.173, "dur": 29.752, "args": { "External id": 21286,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3877 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651520767.907, "dur": 19.064, "args": { "External id": 21287,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651520799.758, "dur": 15.184, "args": { "External id": 21288,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520823.428, "dur": 31.327, "args": { "External id": 21289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651520858.181, "dur": 32.328, "args": { "External id": 21290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3881 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651520916.402, "dur": 208.165, "args": { "External id": 21291,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 3882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651521029.854, "dur": 6.579, "args": { "External id": 21292,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651521038.788, "dur": 2.100, "args": { "External id": 21293,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3884 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651521155.293, "dur": 28.956, "args": { "External id": 21294,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3885 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651521194.747, "dur": 14.013, "args": { "External id": 21295,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521216.727, "dur": 66.609, "args": { "External id": 21296,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521291.534, "dur": 36.631, "args": { "External id": 21297,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521335.308, "dur": 25.332, "args": { "External id": 21298,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521365.092, "dur": 28.444, "args": { "External id": 21299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521399.705, "dur": 21.433, "args": { "External id": 21300,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 3891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651521427.719, "dur": 29.198, "args": { "External id": 21301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 3892 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651521479.439, "dur": 22.987, "args": { "External id": 21302,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 3893 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651521525.816, "dur": 39.061, "args": { "External id": 21303,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 3894 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651521589.401, "dur": 19.776, "args": { "External id": 21304,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 3895 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651521623.710, "dur": 17.291, "args": { "External id": 21305,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 3896 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651521654.956, "dur": 15.872, "args": { "External id": 21306,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 3897 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521741.584, "dur": 17.992, "args": { "External id": 21307,"Record function id": 0, "Ev Idx": 3898 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521744.664, "dur": 13.927, "args": { "External id": 21308,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521748.683, "dur": 9.175, "args": { "External id": 21309,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3900 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521750.128, "dur": 7.614, "args": { "External id": 21310,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3901 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521763.565, "dur": 4.377, "args": { "External id": 21311,"Record function id": 0, "Ev Idx": 3902 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521764.752, "dur": 2.751, "args": { "External id": 21312,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521765.730, "dur": 1.342, "args": { "External id": 21313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3904 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521766.225, "dur": 0.749, "args": { "External id": 21314,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3905 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521771.349, "dur": 4.597, "args": { "External id": 21315,"Record function id": 0, "Ev Idx": 3906 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521772.691, "dur": 2.791, "args": { "External id": 21316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521773.276, "dur": 1.786, "args": { "External id": 21317,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3908 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521774.114, "dur": 0.839, "args": { "External id": 21318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 3909 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521779.182, "dur": 3.678, "args": { "External id": 21319,"Record function id": 0, "Ev Idx": 3910 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521780.124, "dur": 2.321, "args": { "External id": 21320,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521780.779, "dur": 1.226, "args": { "External id": 21321,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3912 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521781.103, "dur": 0.804, "args": { "External id": 21322,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 3913 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521785.980, "dur": 4.148, "args": { "External id": 21323,"Record function id": 0, "Ev Idx": 3914 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521787.178, "dur": 2.529, "args": { "External id": 21324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521788.028, "dur": 1.227, "args": { "External id": 21325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3916 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521788.651, "dur": 0.511, "args": { "External id": 21326,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3917 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521793.387, "dur": 3.940, "args": { "External id": 21327,"Record function id": 0, "Ev Idx": 3918 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521794.389, "dur": 2.506, "args": { "External id": 21328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521795.065, "dur": 1.391, "args": { "External id": 21329,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3920 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521795.489, "dur": 0.901, "args": { "External id": 21330,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3921 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521800.498, "dur": 3.719, "args": { "External id": 21331,"Record function id": 0, "Ev Idx": 3922 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521801.814, "dur": 1.991, "args": { "External id": 21332,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521802.365, "dur": 1.029, "args": { "External id": 21333,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3924 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521802.629, "dur": 0.700, "args": { "External id": 21334,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3925 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521807.367, "dur": 8.324, "args": { "External id": 21335,"Record function id": 0, "Ev Idx": 3926 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521808.480, "dur": 6.757, "args": { "External id": 21336,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521809.173, "dur": 5.656, "args": { "External id": 21337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3928 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521814.095, "dur": 0.618, "args": { "External id": 21338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 3929 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521818.715, "dur": 6.127, "args": { "External id": 21339,"Record function id": 0, "Ev Idx": 3930 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651521819.772, "dur": 4.657, "args": { "External id": 21340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521820.244, "dur": 3.750, "args": { "External id": 21341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3932 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651521823.150, "dur": 0.763, "args": { "External id": 21342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 3933 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651521828.676, "dur": 36433.538, "args": { "External id": 21343,"Record function id": 0, "Sequence number": 246565, "Fwd thread id": 1, "Ev Idx": 3934 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651521829.786, "dur": 36418.643, "args": { "External id": 21344,"Sequence number": 246565, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 3935 } }, { "ph": "f", "id": 203, "pid": 1336754, "tid": 1381179, "ts": 1295651521829.786, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651521858.817, "dur": 39.700, "args": { "External id": 21345,"Record function id": 0, "Ev Idx": 3936 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651521905.742, "dur": 62.439, "args": { "External id": 21346,"Record function id": 0, "Ev Idx": 3937 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.12)", "pid": 1336754, "tid": 1381179, "ts": 1295651521974.304, "dur": 36248.411, "args": { "External id": 21347,"Record function id": 0, "Ev Idx": 3938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651522100.769, "dur": 7.640, "args": { "External id": 21348,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651522118.789, "dur": 4.852, "args": { "External id": 21349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3940 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651522140.482, "dur": 35042.302, "args": { "External id": 21350,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651522154.124, "dur": 35009.676, "args": { "External id": 21351,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 3942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651522193.375, "dur": 14.202, "args": { "External id": 21352,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651522213.973, "dur": 34885.693, "args": { "External id": 21353,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 3944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651522216.587, "dur": 34881.619, "args": { "External id": 21354,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 3945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651522220.672, "dur": 4.791, "args": { "External id": 21355,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651522227.009, "dur": 34860.116, "args": { "External id": 21356,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 3947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651557357.386, "dur": 15.477, "args": { "External id": 21357,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 3948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651557361.874, "dur": 10.450, "args": { "External id": 21358,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3949 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651557415.379, "dur": 389.850, "args": { "External id": 21359,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 3950 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651557453.736, "dur": 346.498, "args": { "External id": 21360,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 3951, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651557468.499, "dur": 325.831, "args": { "External id": 21361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 3952 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651557829.861, "dur": 2.472, "args": { "External id": 21362,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 3953, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651557895.121, "dur": 7.346, "args": { "External id": 21363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651557966.781, "dur": 1.795, "args": { "External id": 21364,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558046.355, "dur": 2.816, "args": { "External id": 21365,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558065.550, "dur": 1.545, "args": { "External id": 21366,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558081.521, "dur": 1.909, "args": { "External id": 21367,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558097.043, "dur": 1.268, "args": { "External id": 21368,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558109.306, "dur": 1.586, "args": { "External id": 21369,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558123.428, "dur": 1.226, "args": { "External id": 21370,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558135.911, "dur": 1.524, "args": { "External id": 21371,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3962 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651558283.731, "dur": 3034.944, "args": { "External id": 21372,"Record function id": 0, "Ev Idx": 3963 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651558313.379, "dur": 1162.608, "args": { "External id": 21373,"Record function id": 0, "Ev Idx": 3964 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651558332.744, "dur": 370.900, "args": { "External id": 21374,"Record function id": 0, "Ev Idx": 3965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558436.403, "dur": 5.313, "args": { "External id": 21375,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 3966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558447.657, "dur": 1.594, "args": { "External id": 21376,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558451.418, "dur": 1.677, "args": { "External id": 21377,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558454.643, "dur": 1.382, "args": { "External id": 21378,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558457.496, "dur": 2.067, "args": { "External id": 21379,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558463.376, "dur": 1.366, "args": { "External id": 21380,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 3971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558466.407, "dur": 1.129, "args": { "External id": 21381,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 3972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558468.775, "dur": 1.057, "args": { "External id": 21382,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558471.484, "dur": 1.251, "args": { "External id": 21383,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651558476.835, "dur": 0.918, "args": { "External id": 21384,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 3975 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651558499.302, "dur": 172.949, "args": { "External id": 21385,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651558518.419, "dur": 149.694, "args": { "External id": 21386,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 3977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651558537.540, "dur": 14.451, "args": { "External id": 21387,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651558557.037, "dur": 81.773, "args": { "External id": 21388,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 3979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651558560.465, "dur": 77.973, "args": { "External id": 21389,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 3980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558564.511, "dur": 6.931, "args": { "External id": 21390,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651558573.605, "dur": 64.228, "args": { "External id": 21391,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 3982 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.10", "pid": 1336754, "tid": 1381179, "ts": 1295651558810.532, "dur": 657.906, "args": { "External id": 21392,"Record function id": 0, "Ev Idx": 3983 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651558828.629, "dur": 626.323, "args": { "External id": 21393,"Record function id": 0, "Ev Idx": 3984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651558892.446, "dur": 5.338, "args": { "External id": 21394,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651558917.236, "dur": 27.298, "args": { "External id": 21395,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 3986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558922.156, "dur": 1.750, "args": { "External id": 21396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558926.088, "dur": 0.718, "args": { "External id": 21397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558928.696, "dur": 0.806, "args": { "External id": 21398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558930.923, "dur": 0.665, "args": { "External id": 21399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558933.339, "dur": 0.636, "args": { "External id": 21400,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558935.152, "dur": 0.565, "args": { "External id": 21401,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558936.871, "dur": 0.458, "args": { "External id": 21402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558938.765, "dur": 0.626, "args": { "External id": 21403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651558940.377, "dur": 0.716, "args": { "External id": 21404,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 3995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651558955.481, "dur": 68.147, "args": { "External id": 21405,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 3996 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651559063.032, "dur": 107.159, "args": { "External id": 21406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 3997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651559074.889, "dur": 4.603, "args": { "External id": 21407,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 3998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651559085.207, "dur": 11.523, "args": { "External id": 21408,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 3999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651559090.112, "dur": 6.224, "args": { "External id": 21409,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559093.578, "dur": 0.967, "args": { "External id": 21410,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651559104.245, "dur": 24.915, "args": { "External id": 21411,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559106.265, "dur": 0.858, "args": { "External id": 21412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559108.407, "dur": 0.243, "args": { "External id": 21413,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559110.020, "dur": 0.708, "args": { "External id": 21414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559112.010, "dur": 0.780, "args": { "External id": 21415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559114.308, "dur": 0.582, "args": { "External id": 21416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559115.934, "dur": 0.579, "args": { "External id": 21417,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559118.098, "dur": 0.346, "args": { "External id": 21418,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559119.945, "dur": 0.725, "args": { "External id": 21419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651559121.811, "dur": 0.521, "args": { "External id": 21420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651559140.600, "dur": 21.779, "args": { "External id": 21421,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4012 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651559219.981, "dur": 154.208, "args": { "External id": 21422,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4013 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651559269.348, "dur": 101.036, "args": { "External id": 21423,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4014, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651559279.657, "dur": 86.222, "args": { "External id": 21424,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4015 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651559393.682, "dur": 1.896, "args": { "External id": 21425,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4016, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651559484.111, "dur": 1806.271, "args": { "External id": 21426,"Sequence number": 246564, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4017 } }, { "ph": "f", "id": 204, "pid": 1336754, "tid": 1381179, "ts": 1295651559484.111, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651559622.191, "dur": 119.243, "args": { "External id": 21427,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4018 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651559793.682, "dur": 51.427, "args": { "External id": 21428,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651559862.602, "dur": 51.522, "args": { "External id": 21429,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651559923.633, "dur": 34.091, "args": { "External id": 21430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651559965.359, "dur": 88.186, "args": { "External id": 21431,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560065.981, "dur": 35.852, "args": { "External id": 21432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560110.807, "dur": 43.151, "args": { "External id": 21433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4024 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651560185.034, "dur": 26.402, "args": { "External id": 21434,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4025 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651560251.292, "dur": 38.898, "args": { "External id": 21435,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4026 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651560319.417, "dur": 21.281, "args": { "External id": 21436,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4027 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651560356.990, "dur": 16.757, "args": { "External id": 21437,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560383.918, "dur": 33.135, "args": { "External id": 21438,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560420.366, "dur": 32.750, "args": { "External id": 21439,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4030 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651560484.203, "dur": 206.680, "args": { "External id": 21440,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651560579.089, "dur": 7.078, "args": { "External id": 21441,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651560588.207, "dur": 3.058, "args": { "External id": 21442,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4033 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651560733.846, "dur": 26.966, "args": { "External id": 21443,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4034 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651560774.033, "dur": 16.619, "args": { "External id": 21444,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560799.094, "dur": 37.134, "args": { "External id": 21445,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560842.451, "dur": 34.533, "args": { "External id": 21446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560883.772, "dur": 20.480, "args": { "External id": 21447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560909.184, "dur": 29.861, "args": { "External id": 21448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560945.661, "dur": 22.646, "args": { "External id": 21449,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651560975.231, "dur": 68.058, "args": { "External id": 21450,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4041 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651561068.961, "dur": 25.369, "args": { "External id": 21451,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4042 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651561115.591, "dur": 24.422, "args": { "External id": 21452,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4043 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651561160.809, "dur": 15.833, "args": { "External id": 21453,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4044 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651561192.466, "dur": 15.283, "args": { "External id": 21454,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4045 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651561223.920, "dur": 32.936, "args": { "External id": 21455,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4046 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561342.210, "dur": 16.958, "args": { "External id": 21456,"Record function id": 0, "Ev Idx": 4047 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561345.762, "dur": 12.113, "args": { "External id": 21457,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561350.643, "dur": 6.356, "args": { "External id": 21458,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4049 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561352.467, "dur": 4.438, "args": { "External id": 21459,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4050 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561363.010, "dur": 5.034, "args": { "External id": 21460,"Record function id": 0, "Ev Idx": 4051 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561364.573, "dur": 3.043, "args": { "External id": 21461,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561365.245, "dur": 1.903, "args": { "External id": 21462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4053 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561365.805, "dur": 1.280, "args": { "External id": 21463,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4054 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561371.309, "dur": 7.678, "args": { "External id": 21464,"Record function id": 0, "Ev Idx": 4055 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561375.650, "dur": 2.869, "args": { "External id": 21465,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561376.417, "dur": 1.707, "args": { "External id": 21466,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4057 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561377.145, "dur": 0.883, "args": { "External id": 21467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4058 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561382.110, "dur": 4.089, "args": { "External id": 21468,"Record function id": 0, "Ev Idx": 4059 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561383.367, "dur": 2.438, "args": { "External id": 21469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561384.039, "dur": 1.311, "args": { "External id": 21470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4061 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561384.520, "dur": 0.708, "args": { "External id": 21471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4062 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561389.302, "dur": 4.238, "args": { "External id": 21472,"Record function id": 0, "Ev Idx": 4063 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561390.366, "dur": 2.760, "args": { "External id": 21473,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561391.146, "dur": 1.564, "args": { "External id": 21474,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4065 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561391.443, "dur": 1.200, "args": { "External id": 21475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4066 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561396.723, "dur": 4.061, "args": { "External id": 21476,"Record function id": 0, "Ev Idx": 4067 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561397.962, "dur": 2.392, "args": { "External id": 21477,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561398.572, "dur": 1.371, "args": { "External id": 21478,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4069 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561399.189, "dur": 0.654, "args": { "External id": 21479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4070 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561403.933, "dur": 3.844, "args": { "External id": 21480,"Record function id": 0, "Ev Idx": 4071 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561404.920, "dur": 2.422, "args": { "External id": 21481,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561405.690, "dur": 1.226, "args": { "External id": 21482,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4073 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561406.139, "dur": 0.711, "args": { "External id": 21483,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4074 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561410.784, "dur": 6.265, "args": { "External id": 21484,"Record function id": 0, "Ev Idx": 4075 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561412.109, "dur": 4.519, "args": { "External id": 21485,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561412.582, "dur": 3.640, "args": { "External id": 21486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4077 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561414.948, "dur": 1.167, "args": { "External id": 21487,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4078 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561420.109, "dur": 3.472, "args": { "External id": 21488,"Record function id": 0, "Ev Idx": 4079 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651561421.023, "dur": 2.160, "args": { "External id": 21489,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561421.475, "dur": 1.306, "args": { "External id": 21490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4081 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651561421.830, "dur": 0.869, "args": { "External id": 21491,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4082 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651561428.194, "dur": 36025.831, "args": { "External id": 21492,"Record function id": 0, "Sequence number": 246563, "Fwd thread id": 1, "Ev Idx": 4083 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651561429.505, "dur": 36014.003, "args": { "External id": 21493,"Sequence number": 246563, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4084 } }, { "ph": "f", "id": 205, "pid": 1336754, "tid": 1381179, "ts": 1295651561429.505, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651561466.449, "dur": 40.434, "args": { "External id": 21494,"Record function id": 0, "Ev Idx": 4085 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651561514.608, "dur": 70.171, "args": { "External id": 21495,"Record function id": 0, "Ev Idx": 4086 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.11)", "pid": 1336754, "tid": 1381179, "ts": 1295651561591.305, "dur": 35843.398, "args": { "External id": 21496,"Record function id": 0, "Ev Idx": 4087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651561688.833, "dur": 7.228, "args": { "External id": 21497,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651561709.797, "dur": 4.524, "args": { "External id": 21498,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4089 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651561730.431, "dur": 34884.764, "args": { "External id": 21499,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651561744.192, "dur": 34860.777, "args": { "External id": 21500,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651561820.465, "dur": 15.442, "args": { "External id": 21501,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651561848.475, "dur": 34717.888, "args": { "External id": 21502,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651561853.789, "dur": 34711.960, "args": { "External id": 21503,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651561857.225, "dur": 4.656, "args": { "External id": 21504,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651561890.784, "dur": 34671.105, "args": { "External id": 21505,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651596711.554, "dur": 9.109, "args": { "External id": 21506,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651596714.374, "dur": 5.941, "args": { "External id": 21507,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4098 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651596748.864, "dur": 366.606, "args": { "External id": 21508,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4099 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651596777.954, "dur": 332.559, "args": { "External id": 21509,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4100, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651596790.567, "dur": 314.284, "args": { "External id": 21510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4101 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651597140.969, "dur": 2.554, "args": { "External id": 21511,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4102, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597204.178, "dur": 6.501, "args": { "External id": 21512,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597274.125, "dur": 2.396, "args": { "External id": 21513,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597293.433, "dur": 1.821, "args": { "External id": 21514,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597306.893, "dur": 0.847, "args": { "External id": 21515,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597319.014, "dur": 1.203, "args": { "External id": 21516,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597329.768, "dur": 1.786, "args": { "External id": 21517,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597345.710, "dur": 1.060, "args": { "External id": 21518,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597360.772, "dur": 1.192, "args": { "External id": 21519,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597372.093, "dur": 1.437, "args": { "External id": 21520,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4111 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651597469.565, "dur": 2789.937, "args": { "External id": 21521,"Record function id": 0, "Ev Idx": 4112 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651597489.422, "dur": 1045.079, "args": { "External id": 21522,"Record function id": 0, "Ev Idx": 4113 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651597504.295, "dur": 316.926, "args": { "External id": 21523,"Record function id": 0, "Ev Idx": 4114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597585.851, "dur": 4.253, "args": { "External id": 21524,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597593.648, "dur": 1.847, "args": { "External id": 21525,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597597.470, "dur": 1.305, "args": { "External id": 21526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597600.415, "dur": 0.711, "args": { "External id": 21527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597605.663, "dur": 1.333, "args": { "External id": 21528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597608.482, "dur": 1.504, "args": { "External id": 21529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597611.670, "dur": 1.775, "args": { "External id": 21530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597614.796, "dur": 1.002, "args": { "External id": 21531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597619.616, "dur": 2.054, "args": { "External id": 21532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651597623.221, "dur": 1.047, "args": { "External id": 21533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4124 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651597642.056, "dur": 150.058, "args": { "External id": 21534,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651597658.716, "dur": 129.306, "args": { "External id": 21535,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651597675.791, "dur": 13.327, "args": { "External id": 21536,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651597693.080, "dur": 67.972, "args": { "External id": 21537,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651597695.890, "dur": 64.879, "args": { "External id": 21538,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651597699.579, "dur": 4.765, "args": { "External id": 21539,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651597705.898, "dur": 54.103, "args": { "External id": 21540,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4131 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.9", "pid": 1336754, "tid": 1381179, "ts": 1295651597909.368, "dur": 617.838, "args": { "External id": 21541,"Record function id": 0, "Ev Idx": 4132 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651597926.000, "dur": 588.272, "args": { "External id": 21542,"Record function id": 0, "Ev Idx": 4133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651598023.598, "dur": 7.011, "args": { "External id": 21543,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651598048.498, "dur": 31.199, "args": { "External id": 21544,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598053.771, "dur": 1.613, "args": { "External id": 21545,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598057.144, "dur": 0.307, "args": { "External id": 21546,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598059.493, "dur": 0.402, "args": { "External id": 21547,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598061.057, "dur": 0.238, "args": { "External id": 21548,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598062.497, "dur": 0.371, "args": { "External id": 21549,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598064.071, "dur": 0.441, "args": { "External id": 21550,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598071.552, "dur": 0.515, "args": { "External id": 21551,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598073.400, "dur": 0.632, "args": { "External id": 21552,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598075.125, "dur": 0.308, "args": { "External id": 21553,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651598090.313, "dur": 32.294, "args": { "External id": 21554,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4145 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651598160.492, "dur": 121.801, "args": { "External id": 21555,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651598170.600, "dur": 3.184, "args": { "External id": 21556,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651598178.894, "dur": 13.895, "args": { "External id": 21557,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651598186.410, "dur": 5.967, "args": { "External id": 21558,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598190.077, "dur": 0.886, "args": { "External id": 21559,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651598201.832, "dur": 22.463, "args": { "External id": 21560,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598203.320, "dur": 0.630, "args": { "External id": 21561,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598205.346, "dur": 0.630, "args": { "External id": 21562,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598207.252, "dur": 0.219, "args": { "External id": 21563,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598209.340, "dur": 0.402, "args": { "External id": 21564,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598210.750, "dur": 0.383, "args": { "External id": 21565,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598212.252, "dur": 0.478, "args": { "External id": 21566,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598213.557, "dur": 0.438, "args": { "External id": 21567,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598216.155, "dur": 0.606, "args": { "External id": 21568,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651598217.697, "dur": 0.732, "args": { "External id": 21569,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651598253.470, "dur": 21.075, "args": { "External id": 21570,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4161 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651598329.769, "dur": 116.920, "args": { "External id": 21571,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4162 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651598357.746, "dur": 85.797, "args": { "External id": 21572,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4163, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651598366.975, "dur": 72.988, "args": { "External id": 21573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4164 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651598464.200, "dur": 1.917, "args": { "External id": 21574,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4165, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651598541.361, "dur": 1676.488, "args": { "External id": 21575,"Sequence number": 246562, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4166 } }, { "ph": "f", "id": 206, "pid": 1336754, "tid": 1381179, "ts": 1295651598541.361, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651598657.431, "dur": 107.555, "args": { "External id": 21576,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651598804.344, "dur": 44.316, "args": { "External id": 21577,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651598864.405, "dur": 48.245, "args": { "External id": 21578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651598921.995, "dur": 32.739, "args": { "External id": 21579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651598961.946, "dur": 88.580, "args": { "External id": 21580,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599062.261, "dur": 32.998, "args": { "External id": 21581,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599104.078, "dur": 42.667, "args": { "External id": 21582,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4173 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651599177.566, "dur": 24.383, "args": { "External id": 21583,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4174 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651599247.350, "dur": 32.661, "args": { "External id": 21584,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4175 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651599308.722, "dur": 19.266, "args": { "External id": 21585,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4176 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651599341.322, "dur": 18.117, "args": { "External id": 21586,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599369.157, "dur": 32.905, "args": { "External id": 21587,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599405.794, "dur": 37.785, "args": { "External id": 21588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4179 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651599473.494, "dur": 177.757, "args": { "External id": 21589,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651599561.936, "dur": 6.684, "args": { "External id": 21590,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651599570.693, "dur": 2.089, "args": { "External id": 21591,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4182 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651599683.139, "dur": 22.679, "args": { "External id": 21592,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4183 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651599715.825, "dur": 13.838, "args": { "External id": 21593,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599738.321, "dur": 33.696, "args": { "External id": 21594,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599778.020, "dur": 34.040, "args": { "External id": 21595,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599819.905, "dur": 20.466, "args": { "External id": 21596,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599845.190, "dur": 33.086, "args": { "External id": 21597,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599884.197, "dur": 18.741, "args": { "External id": 21598,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651599913.046, "dur": 45.473, "args": { "External id": 21599,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4190 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651599983.969, "dur": 60.247, "args": { "External id": 21600,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4191 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651600066.187, "dur": 23.522, "args": { "External id": 21601,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651600106.317, "dur": 19.173, "args": { "External id": 21602,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4193 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651600141.908, "dur": 15.871, "args": { "External id": 21603,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651600172.385, "dur": 18.130, "args": { "External id": 21604,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4195 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600283.238, "dur": 19.264, "args": { "External id": 21605,"Record function id": 0, "Ev Idx": 4196 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600286.692, "dur": 14.514, "args": { "External id": 21606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600290.745, "dur": 9.229, "args": { "External id": 21607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4198 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600295.438, "dur": 4.412, "args": { "External id": 21608,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4199 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600306.450, "dur": 5.155, "args": { "External id": 21609,"Record function id": 0, "Ev Idx": 4200 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600307.677, "dur": 3.495, "args": { "External id": 21610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600308.479, "dur": 2.207, "args": { "External id": 21611,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4202 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600309.396, "dur": 1.225, "args": { "External id": 21612,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4203 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600314.796, "dur": 4.180, "args": { "External id": 21613,"Record function id": 0, "Ev Idx": 4204 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600315.958, "dur": 2.594, "args": { "External id": 21614,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600316.690, "dur": 1.428, "args": { "External id": 21615,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4206 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600317.277, "dur": 0.741, "args": { "External id": 21616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4207 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600322.158, "dur": 3.825, "args": { "External id": 21617,"Record function id": 0, "Ev Idx": 4208 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600323.146, "dur": 2.460, "args": { "External id": 21618,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600323.792, "dur": 1.356, "args": { "External id": 21619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4210 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600324.339, "dur": 0.696, "args": { "External id": 21620,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4211 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600329.023, "dur": 3.629, "args": { "External id": 21621,"Record function id": 0, "Ev Idx": 4212 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600329.919, "dur": 2.336, "args": { "External id": 21622,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600330.449, "dur": 1.351, "args": { "External id": 21623,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4214 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600330.707, "dur": 1.031, "args": { "External id": 21624,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4215 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600335.802, "dur": 3.681, "args": { "External id": 21625,"Record function id": 0, "Ev Idx": 4216 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600336.762, "dur": 2.308, "args": { "External id": 21626,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600337.239, "dur": 1.237, "args": { "External id": 21627,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4218 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600337.748, "dur": 0.664, "args": { "External id": 21628,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4219 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600342.633, "dur": 3.559, "args": { "External id": 21629,"Record function id": 0, "Ev Idx": 4220 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600343.622, "dur": 2.187, "args": { "External id": 21630,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600344.143, "dur": 1.191, "args": { "External id": 21631,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4222 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600344.792, "dur": 0.480, "args": { "External id": 21632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4223 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600349.412, "dur": 4.900, "args": { "External id": 21633,"Record function id": 0, "Ev Idx": 4224 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600350.719, "dur": 3.193, "args": { "External id": 21634,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600351.522, "dur": 1.959, "args": { "External id": 21635,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4226 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600352.037, "dur": 1.384, "args": { "External id": 21636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4227 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600357.501, "dur": 5.711, "args": { "External id": 21637,"Record function id": 0, "Ev Idx": 4228 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651600358.784, "dur": 4.030, "args": { "External id": 21638,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600359.656, "dur": 2.710, "args": { "External id": 21639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4230 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651600361.634, "dur": 0.669, "args": { "External id": 21640,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4231 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651600366.998, "dur": 36178.700, "args": { "External id": 21641,"Record function id": 0, "Sequence number": 246561, "Fwd thread id": 1, "Ev Idx": 4232 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651600368.348, "dur": 36167.898, "args": { "External id": 21642,"Sequence number": 246561, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4233 } }, { "ph": "f", "id": 207, "pid": 1336754, "tid": 1381179, "ts": 1295651600368.348, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651600397.979, "dur": 37.004, "args": { "External id": 21643,"Record function id": 0, "Ev Idx": 4234 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651600444.985, "dur": 66.885, "args": { "External id": 21644,"Record function id": 0, "Ev Idx": 4235 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.10)", "pid": 1336754, "tid": 1381179, "ts": 1295651600518.149, "dur": 36010.508, "args": { "External id": 21645,"Record function id": 0, "Ev Idx": 4236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651600609.600, "dur": 6.947, "args": { "External id": 21646,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651600626.188, "dur": 4.604, "args": { "External id": 21647,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4238 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651600645.197, "dur": 35074.399, "args": { "External id": 21648,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651600660.259, "dur": 35048.577, "args": { "External id": 21649,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651600717.618, "dur": 18.344, "args": { "External id": 21650,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651600745.799, "dur": 34919.804, "args": { "External id": 21651,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651600748.503, "dur": 34916.456, "args": { "External id": 21652,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651600755.980, "dur": 5.721, "args": { "External id": 21653,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651600763.354, "dur": 34897.094, "args": { "External id": 21654,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651635818.850, "dur": 11.577, "args": { "External id": 21655,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651635822.147, "dur": 7.930, "args": { "External id": 21656,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4247 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651635860.078, "dur": 360.214, "args": { "External id": 21657,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4248 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651635892.876, "dur": 322.074, "args": { "External id": 21658,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4249, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651635904.281, "dur": 304.733, "args": { "External id": 21659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4250 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651636257.934, "dur": 3.391, "args": { "External id": 21660,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4251, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636328.263, "dur": 7.214, "args": { "External id": 21661,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636380.658, "dur": 1.435, "args": { "External id": 21662,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636397.270, "dur": 1.636, "args": { "External id": 21663,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636410.603, "dur": 0.766, "args": { "External id": 21664,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636422.289, "dur": 0.857, "args": { "External id": 21665,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636431.696, "dur": 1.087, "args": { "External id": 21666,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636443.505, "dur": 0.720, "args": { "External id": 21667,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636454.188, "dur": 1.086, "args": { "External id": 21668,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636463.874, "dur": 1.043, "args": { "External id": 21669,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4260 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651636561.227, "dur": 2785.543, "args": { "External id": 21670,"Record function id": 0, "Ev Idx": 4261 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651636581.896, "dur": 1041.827, "args": { "External id": 21671,"Record function id": 0, "Ev Idx": 4262 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651636597.266, "dur": 326.839, "args": { "External id": 21672,"Record function id": 0, "Ev Idx": 4263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636679.972, "dur": 4.842, "args": { "External id": 21673,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636691.551, "dur": 1.750, "args": { "External id": 21674,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636695.328, "dur": 1.103, "args": { "External id": 21675,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636700.079, "dur": 1.495, "args": { "External id": 21676,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636703.001, "dur": 1.513, "args": { "External id": 21677,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636706.245, "dur": 1.134, "args": { "External id": 21678,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636709.015, "dur": 1.295, "args": { "External id": 21679,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636714.206, "dur": 0.830, "args": { "External id": 21680,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636716.202, "dur": 1.333, "args": { "External id": 21681,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651636718.945, "dur": 1.555, "args": { "External id": 21682,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4273 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651636737.920, "dur": 155.797, "args": { "External id": 21683,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651636754.357, "dur": 135.244, "args": { "External id": 21684,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651636770.070, "dur": 12.941, "args": { "External id": 21685,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651636786.335, "dur": 75.889, "args": { "External id": 21686,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651636791.648, "dur": 70.242, "args": { "External id": 21687,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651636795.326, "dur": 6.174, "args": { "External id": 21688,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651636805.079, "dur": 56.199, "args": { "External id": 21689,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4280 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.8", "pid": 1336754, "tid": 1381179, "ts": 1295651637053.865, "dur": 562.730, "args": { "External id": 21690,"Record function id": 0, "Ev Idx": 4281 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651637072.431, "dur": 531.505, "args": { "External id": 21691,"Record function id": 0, "Ev Idx": 4282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651637134.283, "dur": 6.066, "args": { "External id": 21692,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651637156.561, "dur": 28.059, "args": { "External id": 21693,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637161.956, "dur": 1.841, "args": { "External id": 21694,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637166.109, "dur": 0.271, "args": { "External id": 21695,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637168.460, "dur": 0.388, "args": { "External id": 21696,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637170.449, "dur": 0.604, "args": { "External id": 21697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637172.629, "dur": 0.500, "args": { "External id": 21698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637174.696, "dur": 0.985, "args": { "External id": 21699,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637177.747, "dur": 0.405, "args": { "External id": 21700,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637178.892, "dur": 0.870, "args": { "External id": 21701,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637180.483, "dur": 0.320, "args": { "External id": 21702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651637194.839, "dur": 31.214, "args": { "External id": 21703,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651637274.857, "dur": 101.021, "args": { "External id": 21704,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651637285.862, "dur": 4.672, "args": { "External id": 21705,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651637296.082, "dur": 11.300, "args": { "External id": 21706,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651637300.324, "dur": 6.650, "args": { "External id": 21707,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637304.387, "dur": 0.588, "args": { "External id": 21708,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651637314.368, "dur": 23.865, "args": { "External id": 21709,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637316.579, "dur": 0.559, "args": { "External id": 21710,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637318.474, "dur": 1.210, "args": { "External id": 21711,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637320.993, "dur": 0.318, "args": { "External id": 21712,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637321.985, "dur": 0.973, "args": { "External id": 21713,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637323.878, "dur": 0.211, "args": { "External id": 21714,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637324.974, "dur": 0.781, "args": { "External id": 21715,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637327.160, "dur": 0.491, "args": { "External id": 21716,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637328.614, "dur": 1.022, "args": { "External id": 21717,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651637330.847, "dur": 0.379, "args": { "External id": 21718,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651637348.795, "dur": 19.913, "args": { "External id": 21719,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4310 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651637420.156, "dur": 116.920, "args": { "External id": 21720,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4311 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651637448.438, "dur": 85.299, "args": { "External id": 21721,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4312, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651637457.890, "dur": 71.923, "args": { "External id": 21722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4313 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651637554.494, "dur": 1.822, "args": { "External id": 21723,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4314, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651637631.270, "dur": 1690.252, "args": { "External id": 21724,"Sequence number": 246560, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4315 } }, { "ph": "f", "id": 208, "pid": 1336754, "tid": 1381179, "ts": 1295651637631.270, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651637744.248, "dur": 103.428, "args": { "External id": 21725,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4316 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651637886.777, "dur": 41.650, "args": { "External id": 21726,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651637944.837, "dur": 91.337, "args": { "External id": 21727,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638050.966, "dur": 38.700, "args": { "External id": 21728,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638096.502, "dur": 46.318, "args": { "External id": 21729,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638150.732, "dur": 27.369, "args": { "External id": 21730,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638186.634, "dur": 57.992, "args": { "External id": 21731,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4322 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651638278.922, "dur": 24.428, "args": { "External id": 21732,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4323 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651638322.879, "dur": 34.153, "args": { "External id": 21733,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4324 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651638380.765, "dur": 18.354, "args": { "External id": 21734,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651638413.563, "dur": 14.433, "args": { "External id": 21735,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638436.975, "dur": 33.264, "args": { "External id": 21736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638476.977, "dur": 33.711, "args": { "External id": 21737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4328 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651638541.243, "dur": 177.322, "args": { "External id": 21738,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651638624.239, "dur": 6.198, "args": { "External id": 21739,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651638632.190, "dur": 2.348, "args": { "External id": 21740,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4331 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651638750.037, "dur": 26.966, "args": { "External id": 21741,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4332 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651638787.376, "dur": 13.688, "args": { "External id": 21742,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638808.288, "dur": 36.663, "args": { "External id": 21743,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638850.912, "dur": 36.720, "args": { "External id": 21744,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638894.273, "dur": 20.292, "args": { "External id": 21745,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638921.298, "dur": 30.489, "args": { "External id": 21746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638957.319, "dur": 19.576, "args": { "External id": 21747,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651638983.857, "dur": 89.012, "args": { "External id": 21748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4339 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651639107.411, "dur": 24.159, "args": { "External id": 21749,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4340 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651639152.576, "dur": 22.549, "args": { "External id": 21750,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4341 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651639198.539, "dur": 15.789, "args": { "External id": 21751,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4342 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651639244.845, "dur": 18.237, "args": { "External id": 21752,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4343 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651639278.149, "dur": 15.053, "args": { "External id": 21753,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4344 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639368.682, "dur": 15.607, "args": { "External id": 21754,"Record function id": 0, "Ev Idx": 4345 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639372.100, "dur": 11.042, "args": { "External id": 21755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639376.126, "dur": 6.133, "args": { "External id": 21756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4347 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639377.643, "dur": 4.526, "args": { "External id": 21757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4348 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639388.354, "dur": 4.828, "args": { "External id": 21758,"Record function id": 0, "Ev Idx": 4349 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639389.675, "dur": 2.971, "args": { "External id": 21759,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639390.668, "dur": 1.434, "args": { "External id": 21760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4351 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639391.208, "dur": 0.825, "args": { "External id": 21761,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4352 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639396.638, "dur": 4.488, "args": { "External id": 21762,"Record function id": 0, "Ev Idx": 4353 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639397.835, "dur": 2.879, "args": { "External id": 21763,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639398.384, "dur": 1.897, "args": { "External id": 21764,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4355 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639399.299, "dur": 0.896, "args": { "External id": 21765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4356 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639404.329, "dur": 3.449, "args": { "External id": 21766,"Record function id": 0, "Ev Idx": 4357 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639405.331, "dur": 2.052, "args": { "External id": 21767,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639405.955, "dur": 0.901, "args": { "External id": 21768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4359 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639406.217, "dur": 0.559, "args": { "External id": 21769,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4360 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639410.850, "dur": 3.561, "args": { "External id": 21770,"Record function id": 0, "Ev Idx": 4361 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639411.980, "dur": 1.980, "args": { "External id": 21771,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639412.467, "dur": 0.999, "args": { "External id": 21772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4363 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639412.802, "dur": 0.578, "args": { "External id": 21773,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4364 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639417.462, "dur": 3.939, "args": { "External id": 21774,"Record function id": 0, "Ev Idx": 4365 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639418.526, "dur": 2.494, "args": { "External id": 21775,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639419.304, "dur": 1.294, "args": { "External id": 21776,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4367 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639419.773, "dur": 0.728, "args": { "External id": 21777,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4368 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639424.597, "dur": 5.498, "args": { "External id": 21778,"Record function id": 0, "Ev Idx": 4369 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639425.716, "dur": 3.983, "args": { "External id": 21779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639426.219, "dur": 3.035, "args": { "External id": 21780,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4371 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639428.478, "dur": 0.708, "args": { "External id": 21781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4372 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639433.182, "dur": 3.835, "args": { "External id": 21782,"Record function id": 0, "Ev Idx": 4373 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639434.267, "dur": 2.341, "args": { "External id": 21783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639434.932, "dur": 1.207, "args": { "External id": 21784,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4375 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639435.448, "dur": 0.628, "args": { "External id": 21785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4376 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639440.050, "dur": 3.359, "args": { "External id": 21786,"Record function id": 0, "Ev Idx": 4377 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651639440.898, "dur": 2.099, "args": { "External id": 21787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639441.384, "dur": 1.145, "args": { "External id": 21788,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4379 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651639441.658, "dur": 0.803, "args": { "External id": 21789,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4380 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651639447.471, "dur": 35864.802, "args": { "External id": 21790,"Record function id": 0, "Sequence number": 246559, "Fwd thread id": 1, "Ev Idx": 4381 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651639448.636, "dur": 35852.349, "args": { "External id": 21791,"Sequence number": 246559, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4382 } }, { "ph": "f", "id": 209, "pid": 1336754, "tid": 1381179, "ts": 1295651639448.636, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651639476.846, "dur": 39.234, "args": { "External id": 21792,"Record function id": 0, "Ev Idx": 4383 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651639523.256, "dur": 61.011, "args": { "External id": 21793,"Record function id": 0, "Ev Idx": 4384 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.9)", "pid": 1336754, "tid": 1381179, "ts": 1295651639592.128, "dur": 35700.404, "args": { "External id": 21794,"Record function id": 0, "Ev Idx": 4385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651639680.160, "dur": 6.658, "args": { "External id": 21795,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651639696.440, "dur": 4.717, "args": { "External id": 21796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4387 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651639715.556, "dur": 34706.501, "args": { "External id": 21797,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651639729.842, "dur": 34681.535, "args": { "External id": 21798,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651639783.184, "dur": 13.740, "args": { "External id": 21799,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651639805.142, "dur": 34565.464, "args": { "External id": 21800,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651639807.882, "dur": 34561.852, "args": { "External id": 21801,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651639811.501, "dur": 4.940, "args": { "External id": 21802,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651639818.017, "dur": 34546.181, "args": { "External id": 21803,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651674527.119, "dur": 12.639, "args": { "External id": 21804,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651674530.470, "dur": 8.887, "args": { "External id": 21805,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4396 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651674568.866, "dur": 381.940, "args": { "External id": 21806,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4397 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651674600.653, "dur": 345.048, "args": { "External id": 21807,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4398, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651674613.989, "dur": 325.888, "args": { "External id": 21808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4399 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651674972.204, "dur": 2.475, "args": { "External id": 21809,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4400, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675070.750, "dur": 7.277, "args": { "External id": 21810,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675123.111, "dur": 1.545, "args": { "External id": 21811,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675139.908, "dur": 1.261, "args": { "External id": 21812,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675151.898, "dur": 1.054, "args": { "External id": 21813,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675164.379, "dur": 1.026, "args": { "External id": 21814,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675178.676, "dur": 0.727, "args": { "External id": 21815,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675189.352, "dur": 1.145, "args": { "External id": 21816,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675202.254, "dur": 1.182, "args": { "External id": 21817,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675213.032, "dur": 0.958, "args": { "External id": 21818,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4409 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651675327.842, "dur": 2755.551, "args": { "External id": 21819,"Record function id": 0, "Ev Idx": 4410 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651675347.832, "dur": 1027.523, "args": { "External id": 21820,"Record function id": 0, "Ev Idx": 4411 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651675364.077, "dur": 322.040, "args": { "External id": 21821,"Record function id": 0, "Ev Idx": 4412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675451.978, "dur": 4.689, "args": { "External id": 21822,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675460.134, "dur": 1.723, "args": { "External id": 21823,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675463.815, "dur": 1.143, "args": { "External id": 21824,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675468.247, "dur": 1.331, "args": { "External id": 21825,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675471.127, "dur": 0.943, "args": { "External id": 21826,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675473.672, "dur": 1.092, "args": { "External id": 21827,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675476.538, "dur": 1.239, "args": { "External id": 21828,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675481.834, "dur": 1.479, "args": { "External id": 21829,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675484.949, "dur": 0.944, "args": { "External id": 21830,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651675487.272, "dur": 1.347, "args": { "External id": 21831,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4422 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651675508.952, "dur": 150.294, "args": { "External id": 21832,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651675524.864, "dur": 129.823, "args": { "External id": 21833,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651675541.325, "dur": 12.704, "args": { "External id": 21834,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651675557.441, "dur": 69.878, "args": { "External id": 21835,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651675560.242, "dur": 66.734, "args": { "External id": 21836,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675563.657, "dur": 5.244, "args": { "External id": 21837,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651675572.617, "dur": 53.806, "args": { "External id": 21838,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4429 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.7", "pid": 1336754, "tid": 1381179, "ts": 1295651675774.675, "dur": 593.306, "args": { "External id": 21839,"Record function id": 0, "Ev Idx": 4430 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651675790.427, "dur": 565.396, "args": { "External id": 21840,"Record function id": 0, "Ev Idx": 4431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651675850.404, "dur": 4.844, "args": { "External id": 21841,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651675871.520, "dur": 24.865, "args": { "External id": 21842,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675876.083, "dur": 1.540, "args": { "External id": 21843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675879.532, "dur": 0.439, "args": { "External id": 21844,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675882.153, "dur": 0.522, "args": { "External id": 21845,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675883.886, "dur": 0.172, "args": { "External id": 21846,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675885.063, "dur": 0.990, "args": { "External id": 21847,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675887.813, "dur": 0.359, "args": { "External id": 21848,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675888.933, "dur": 0.699, "args": { "External id": 21849,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675891.299, "dur": 0.505, "args": { "External id": 21850,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651675892.674, "dur": 0.323, "args": { "External id": 21851,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651675906.071, "dur": 27.950, "args": { "External id": 21852,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4443 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651675963.423, "dur": 138.483, "args": { "External id": 21853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651675972.766, "dur": 3.443, "args": { "External id": 21854,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651676017.601, "dur": 11.870, "args": { "External id": 21855,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651676022.633, "dur": 6.411, "args": { "External id": 21856,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676026.482, "dur": 0.732, "args": { "External id": 21857,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651676038.491, "dur": 20.046, "args": { "External id": 21858,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676040.377, "dur": 0.342, "args": { "External id": 21859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676042.308, "dur": 0.308, "args": { "External id": 21860,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676043.938, "dur": 0.628, "args": { "External id": 21861,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676045.350, "dur": 0.214, "args": { "External id": 21862,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676046.443, "dur": 0.553, "args": { "External id": 21863,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676048.596, "dur": 0.398, "args": { "External id": 21864,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676049.869, "dur": 0.524, "args": { "External id": 21865,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676051.681, "dur": 0.607, "args": { "External id": 21866,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651676053.138, "dur": 0.199, "args": { "External id": 21867,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651676072.531, "dur": 21.259, "args": { "External id": 21868,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4459 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651676146.140, "dur": 135.807, "args": { "External id": 21869,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4460 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651676174.260, "dur": 103.870, "args": { "External id": 21870,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4461, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651676183.569, "dur": 90.057, "args": { "External id": 21871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4462 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651676302.880, "dur": 1.924, "args": { "External id": 21872,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4463, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651676383.523, "dur": 1675.885, "args": { "External id": 21873,"Sequence number": 246558, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4464 } }, { "ph": "f", "id": 210, "pid": 1336754, "tid": 1381179, "ts": 1295651676383.523, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651676495.784, "dur": 111.073, "args": { "External id": 21874,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4465 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651676646.982, "dur": 42.927, "args": { "External id": 21875,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651676706.248, "dur": 50.011, "args": { "External id": 21876,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651676766.198, "dur": 34.425, "args": { "External id": 21877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651676807.107, "dur": 46.051, "args": { "External id": 21878,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651676861.893, "dur": 28.696, "args": { "External id": 21879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651676898.608, "dur": 42.575, "args": { "External id": 21880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4471 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651676966.638, "dur": 64.152, "args": { "External id": 21881,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4472 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651677052.651, "dur": 34.247, "args": { "External id": 21882,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4473 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651677110.760, "dur": 22.369, "args": { "External id": 21883,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4474 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651677147.465, "dur": 14.683, "args": { "External id": 21884,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677170.361, "dur": 35.926, "args": { "External id": 21885,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677209.741, "dur": 52.929, "args": { "External id": 21886,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4477 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651677293.700, "dur": 175.103, "args": { "External id": 21887,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651677378.804, "dur": 6.279, "args": { "External id": 21888,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651677386.793, "dur": 1.907, "args": { "External id": 21889,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4480 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651677504.063, "dur": 26.019, "args": { "External id": 21890,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4481 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651677542.592, "dur": 13.563, "args": { "External id": 21891,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677563.972, "dur": 49.245, "args": { "External id": 21892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677619.278, "dur": 39.542, "args": { "External id": 21893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677665.411, "dur": 23.272, "args": { "External id": 21894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677693.423, "dur": 41.642, "args": { "External id": 21895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677748.598, "dur": 23.739, "args": { "External id": 21896,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651677778.885, "dur": 32.076, "args": { "External id": 21897,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4488 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651677835.385, "dur": 22.849, "args": { "External id": 21898,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4489 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651677880.423, "dur": 23.367, "args": { "External id": 21899,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4490 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651677919.419, "dur": 16.267, "args": { "External id": 21900,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4491 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651677951.437, "dur": 13.342, "args": { "External id": 21901,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4492 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651677977.028, "dur": 50.917, "args": { "External id": 21902,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4493 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678106.041, "dur": 15.069, "args": { "External id": 21903,"Record function id": 0, "Ev Idx": 4494 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678109.406, "dur": 10.695, "args": { "External id": 21904,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678113.471, "dur": 5.778, "args": { "External id": 21905,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4496 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678114.940, "dur": 4.188, "args": { "External id": 21906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4497 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678124.921, "dur": 5.523, "args": { "External id": 21907,"Record function id": 0, "Ev Idx": 4498 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678126.514, "dur": 3.500, "args": { "External id": 21908,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678127.804, "dur": 1.689, "args": { "External id": 21909,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4500 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678128.514, "dur": 0.910, "args": { "External id": 21910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4501 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678133.765, "dur": 6.461, "args": { "External id": 21911,"Record function id": 0, "Ev Idx": 4502 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678135.185, "dur": 4.612, "args": { "External id": 21912,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678136.213, "dur": 2.856, "args": { "External id": 21913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4504 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678136.932, "dur": 2.026, "args": { "External id": 21914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4505 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678143.479, "dur": 4.187, "args": { "External id": 21915,"Record function id": 0, "Ev Idx": 4506 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678144.578, "dur": 2.640, "args": { "External id": 21916,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678145.294, "dur": 1.361, "args": { "External id": 21917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4508 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678145.703, "dur": 0.860, "args": { "External id": 21918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4509 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678150.766, "dur": 4.096, "args": { "External id": 21919,"Record function id": 0, "Ev Idx": 4510 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678152.094, "dur": 2.340, "args": { "External id": 21920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678152.745, "dur": 1.293, "args": { "External id": 21921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4512 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678153.323, "dur": 0.651, "args": { "External id": 21922,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4513 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678158.134, "dur": 4.247, "args": { "External id": 21923,"Record function id": 0, "Ev Idx": 4514 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678159.190, "dur": 2.764, "args": { "External id": 21924,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678160.041, "dur": 1.516, "args": { "External id": 21925,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4516 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678160.819, "dur": 0.672, "args": { "External id": 21926,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4517 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678165.557, "dur": 6.061, "args": { "External id": 21927,"Record function id": 0, "Ev Idx": 4518 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678166.552, "dur": 4.642, "args": { "External id": 21928,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678167.232, "dur": 3.303, "args": { "External id": 21929,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4520 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678169.834, "dur": 0.615, "args": { "External id": 21930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4521 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678177.756, "dur": 3.927, "args": { "External id": 21931,"Record function id": 0, "Ev Idx": 4522 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678178.743, "dur": 2.526, "args": { "External id": 21932,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678179.641, "dur": 1.221, "args": { "External id": 21933,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4524 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678179.923, "dur": 0.854, "args": { "External id": 21934,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4525 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678184.701, "dur": 3.408, "args": { "External id": 21935,"Record function id": 0, "Ev Idx": 4526 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651678185.570, "dur": 2.117, "args": { "External id": 21936,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678186.134, "dur": 1.009, "args": { "External id": 21937,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4528 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651678186.438, "dur": 0.639, "args": { "External id": 21938,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4529 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651678191.799, "dur": 36095.551, "args": { "External id": 21939,"Record function id": 0, "Sequence number": 246557, "Fwd thread id": 1, "Ev Idx": 4530 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651678193.114, "dur": 36084.022, "args": { "External id": 21940,"Sequence number": 246557, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4531 } }, { "ph": "f", "id": 211, "pid": 1336754, "tid": 1381179, "ts": 1295651678193.114, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651678223.316, "dur": 56.326, "args": { "External id": 21941,"Record function id": 0, "Ev Idx": 4532 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651678288.880, "dur": 64.821, "args": { "External id": 21942,"Record function id": 0, "Ev Idx": 4533 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.8)", "pid": 1336754, "tid": 1381179, "ts": 1295651678359.526, "dur": 35908.997, "args": { "External id": 21943,"Record function id": 0, "Ev Idx": 4534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651678450.105, "dur": 7.227, "args": { "External id": 21944,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651678467.545, "dur": 4.633, "args": { "External id": 21945,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4536 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651678489.247, "dur": 34934.708, "args": { "External id": 21946,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651678503.085, "dur": 34912.732, "args": { "External id": 21947,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651678546.789, "dur": 17.842, "args": { "External id": 21948,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651678571.351, "dur": 34806.695, "args": { "External id": 21949,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651678573.886, "dur": 34803.607, "args": { "External id": 21950,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651678577.854, "dur": 5.635, "args": { "External id": 21951,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651678585.113, "dur": 34788.972, "args": { "External id": 21952,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651713510.476, "dur": 9.877, "args": { "External id": 21953,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651713513.225, "dur": 6.804, "args": { "External id": 21954,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4545 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651713547.010, "dur": 378.542, "args": { "External id": 21955,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4546 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651713577.131, "dur": 343.448, "args": { "External id": 21956,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4547, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651713588.274, "dur": 326.902, "args": { "External id": 21957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4548 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651713945.567, "dur": 2.296, "args": { "External id": 21958,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4549, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714042.716, "dur": 7.477, "args": { "External id": 21959,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714094.648, "dur": 2.038, "args": { "External id": 21960,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714111.570, "dur": 1.255, "args": { "External id": 21961,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714124.918, "dur": 1.052, "args": { "External id": 21962,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714141.255, "dur": 0.916, "args": { "External id": 21963,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714151.074, "dur": 1.122, "args": { "External id": 21964,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714162.540, "dur": 0.751, "args": { "External id": 21965,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714173.678, "dur": 1.673, "args": { "External id": 21966,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714184.415, "dur": 1.156, "args": { "External id": 21967,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4558 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651714303.303, "dur": 2751.519, "args": { "External id": 21968,"Record function id": 0, "Ev Idx": 4559 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651714323.193, "dur": 1067.013, "args": { "External id": 21969,"Record function id": 0, "Ev Idx": 4560 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651714337.263, "dur": 316.409, "args": { "External id": 21970,"Record function id": 0, "Ev Idx": 4561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714423.420, "dur": 5.227, "args": { "External id": 21971,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714431.640, "dur": 1.191, "args": { "External id": 21972,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714436.295, "dur": 1.430, "args": { "External id": 21973,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714439.500, "dur": 0.695, "args": { "External id": 21974,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714441.822, "dur": 1.741, "args": { "External id": 21975,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714445.056, "dur": 1.423, "args": { "External id": 21976,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714449.707, "dur": 1.826, "args": { "External id": 21977,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714453.326, "dur": 1.012, "args": { "External id": 21978,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714455.649, "dur": 0.992, "args": { "External id": 21979,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651714458.420, "dur": 1.031, "args": { "External id": 21980,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4571 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651714480.858, "dur": 146.371, "args": { "External id": 21981,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651714496.055, "dur": 126.566, "args": { "External id": 21982,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651714511.599, "dur": 12.940, "args": { "External id": 21983,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651714528.098, "dur": 68.050, "args": { "External id": 21984,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651714530.795, "dur": 64.995, "args": { "External id": 21985,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714534.648, "dur": 5.722, "args": { "External id": 21986,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651714542.228, "dur": 53.054, "args": { "External id": 21987,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4578 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.6", "pid": 1336754, "tid": 1381179, "ts": 1295651714746.852, "dur": 635.046, "args": { "External id": 21988,"Record function id": 0, "Ev Idx": 4579 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651714762.876, "dur": 605.685, "args": { "External id": 21989,"Record function id": 0, "Ev Idx": 4580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651714824.330, "dur": 4.254, "args": { "External id": 21990,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651714844.272, "dur": 27.235, "args": { "External id": 21991,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714849.562, "dur": 1.954, "args": { "External id": 21992,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714853.592, "dur": 0.648, "args": { "External id": 21993,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714855.216, "dur": 0.539, "args": { "External id": 21994,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714857.653, "dur": 0.583, "args": { "External id": 21995,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714859.796, "dur": 0.310, "args": { "External id": 21996,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714861.315, "dur": 1.493, "args": { "External id": 21997,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714864.486, "dur": 0.360, "args": { "External id": 21998,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714865.724, "dur": 1.053, "args": { "External id": 21999,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714867.836, "dur": 0.869, "args": { "External id": 22000,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651714881.549, "dur": 30.745, "args": { "External id": 22001,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4592 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651714941.999, "dur": 160.608, "args": { "External id": 22002,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651714950.946, "dur": 3.054, "args": { "External id": 22003,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651714958.759, "dur": 14.684, "args": { "External id": 22004,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651714963.530, "dur": 9.485, "args": { "External id": 22005,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651714970.714, "dur": 0.464, "args": { "External id": 22006,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651714980.351, "dur": 59.285, "args": { "External id": 22007,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715019.333, "dur": 0.945, "args": { "External id": 22008,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715021.974, "dur": 0.574, "args": { "External id": 22009,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715023.763, "dur": 1.059, "args": { "External id": 22010,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715026.107, "dur": 0.212, "args": { "External id": 22011,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715027.617, "dur": 0.169, "args": { "External id": 22012,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715029.303, "dur": 0.590, "args": { "External id": 22013,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715031.278, "dur": 0.329, "args": { "External id": 22014,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715032.573, "dur": 0.189, "args": { "External id": 22015,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651715034.140, "dur": 0.409, "args": { "External id": 22016,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651715071.845, "dur": 23.104, "args": { "External id": 22017,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4608 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651715152.525, "dur": 138.872, "args": { "External id": 22018,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4609 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651715179.728, "dur": 107.992, "args": { "External id": 22019,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4610, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651715188.787, "dur": 94.552, "args": { "External id": 22020,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4611 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651715313.038, "dur": 1.873, "args": { "External id": 22021,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4612, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651715397.356, "dur": 1630.990, "args": { "External id": 22022,"Sequence number": 246556, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4613 } }, { "ph": "f", "id": 212, "pid": 1336754, "tid": 1381179, "ts": 1295651715397.356, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651715509.973, "dur": 103.802, "args": { "External id": 22023,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651715651.632, "dur": 40.335, "args": { "External id": 22024,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651715707.623, "dur": 48.543, "args": { "External id": 22025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651715765.392, "dur": 32.689, "args": { "External id": 22026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651715808.204, "dur": 44.459, "args": { "External id": 22027,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651715861.080, "dur": 27.560, "args": { "External id": 22028,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651715895.541, "dur": 41.901, "args": { "External id": 22029,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4620 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651715964.705, "dur": 60.681, "args": { "External id": 22030,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4621 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651716046.848, "dur": 31.719, "args": { "External id": 22031,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4622 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651716103.687, "dur": 21.340, "args": { "External id": 22032,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651716139.684, "dur": 14.330, "args": { "External id": 22033,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716162.822, "dur": 33.225, "args": { "External id": 22034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716199.635, "dur": 47.843, "args": { "External id": 22035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4626 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651716276.994, "dur": 175.893, "args": { "External id": 22036,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651716358.646, "dur": 6.449, "args": { "External id": 22037,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651716366.832, "dur": 3.987, "args": { "External id": 22038,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4629 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651716486.278, "dur": 25.064, "args": { "External id": 22039,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4630 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651716521.626, "dur": 13.636, "args": { "External id": 22040,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716542.348, "dur": 40.693, "args": { "External id": 22041,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716588.951, "dur": 34.214, "args": { "External id": 22042,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716632.976, "dur": 20.406, "args": { "External id": 22043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716657.448, "dur": 32.819, "args": { "External id": 22044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716696.141, "dur": 33.747, "args": { "External id": 22045,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651716742.396, "dur": 44.213, "args": { "External id": 22046,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4637 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651716807.024, "dur": 24.390, "args": { "External id": 22047,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4638 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651716849.037, "dur": 23.482, "args": { "External id": 22048,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651716892.770, "dur": 15.497, "args": { "External id": 22049,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4640 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651716922.041, "dur": 16.529, "args": { "External id": 22050,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651716952.081, "dur": 14.315, "args": { "External id": 22051,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4642 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717077.222, "dur": 14.942, "args": { "External id": 22052,"Record function id": 0, "Ev Idx": 4643 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717080.609, "dur": 10.676, "args": { "External id": 22053,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717084.351, "dur": 6.106, "args": { "External id": 22054,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4645 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717085.910, "dur": 4.433, "args": { "External id": 22055,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4646 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717096.070, "dur": 4.288, "args": { "External id": 22056,"Record function id": 0, "Ev Idx": 4647 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717097.330, "dur": 2.580, "args": { "External id": 22057,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717098.207, "dur": 1.253, "args": { "External id": 22058,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4649 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717098.578, "dur": 0.805, "args": { "External id": 22059,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4650 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717103.795, "dur": 7.236, "args": { "External id": 22060,"Record function id": 0, "Ev Idx": 4651 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717107.923, "dur": 2.702, "args": { "External id": 22061,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717108.898, "dur": 1.318, "args": { "External id": 22062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4653 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717109.441, "dur": 0.713, "args": { "External id": 22063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4654 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717114.270, "dur": 3.973, "args": { "External id": 22064,"Record function id": 0, "Ev Idx": 4655 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717115.427, "dur": 2.408, "args": { "External id": 22065,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717116.349, "dur": 1.074, "args": { "External id": 22066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4657 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717116.650, "dur": 0.692, "args": { "External id": 22067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4658 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717121.282, "dur": 5.204, "args": { "External id": 22068,"Record function id": 0, "Ev Idx": 4659 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717122.540, "dur": 3.505, "args": { "External id": 22069,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717123.352, "dur": 2.255, "args": { "External id": 22070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4661 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717124.012, "dur": 1.489, "args": { "External id": 22071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4662 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717129.585, "dur": 6.136, "args": { "External id": 22072,"Record function id": 0, "Ev Idx": 4663 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717130.609, "dur": 4.703, "args": { "External id": 22073,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717131.123, "dur": 3.754, "args": { "External id": 22074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4665 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717133.911, "dur": 0.897, "args": { "External id": 22075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4666 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717138.910, "dur": 3.204, "args": { "External id": 22076,"Record function id": 0, "Ev Idx": 4667 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717139.884, "dur": 1.829, "args": { "External id": 22077,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717140.329, "dur": 0.971, "args": { "External id": 22078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4669 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717140.627, "dur": 0.607, "args": { "External id": 22079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4670 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717145.236, "dur": 3.354, "args": { "External id": 22080,"Record function id": 0, "Ev Idx": 4671 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717146.116, "dur": 2.073, "args": { "External id": 22081,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717146.603, "dur": 1.148, "args": { "External id": 22082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4673 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717146.978, "dur": 0.705, "args": { "External id": 22083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4674 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717151.679, "dur": 3.338, "args": { "External id": 22084,"Record function id": 0, "Ev Idx": 4675 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651717152.740, "dur": 1.872, "args": { "External id": 22085,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717153.359, "dur": 0.834, "args": { "External id": 22086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4677 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651717153.687, "dur": 0.442, "args": { "External id": 22087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4678 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651717158.692, "dur": 35585.394, "args": { "External id": 22088,"Record function id": 0, "Sequence number": 246555, "Fwd thread id": 1, "Ev Idx": 4679 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651717159.882, "dur": 35574.642, "args": { "External id": 22089,"Sequence number": 246555, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4680 } }, { "ph": "f", "id": 213, "pid": 1336754, "tid": 1381179, "ts": 1295651717159.882, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651717193.888, "dur": 50.426, "args": { "External id": 22090,"Record function id": 0, "Ev Idx": 4681 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651717254.652, "dur": 69.108, "args": { "External id": 22091,"Record function id": 0, "Ev Idx": 4682 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.7)", "pid": 1336754, "tid": 1381179, "ts": 1295651717329.876, "dur": 35396.595, "args": { "External id": 22092,"Record function id": 0, "Ev Idx": 4683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651717417.703, "dur": 6.870, "args": { "External id": 22093,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651717434.861, "dur": 5.002, "args": { "External id": 22094,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4685 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651717454.330, "dur": 34467.928, "args": { "External id": 22095,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651717467.601, "dur": 34440.308, "args": { "External id": 22096,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651717509.089, "dur": 17.916, "args": { "External id": 22097,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651717533.529, "dur": 34335.388, "args": { "External id": 22098,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651717535.892, "dur": 34331.906, "args": { "External id": 22099,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651717539.552, "dur": 4.756, "args": { "External id": 22100,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651717548.120, "dur": 34314.949, "args": { "External id": 22101,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651752047.698, "dur": 11.040, "args": { "External id": 22102,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651752050.908, "dur": 7.246, "args": { "External id": 22103,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4694 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651752088.680, "dur": 352.119, "args": { "External id": 22104,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4695 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651752117.811, "dur": 318.273, "args": { "External id": 22105,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4696, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651752129.046, "dur": 301.252, "args": { "External id": 22106,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4697 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651752465.560, "dur": 2.458, "args": { "External id": 22107,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4698, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752525.554, "dur": 6.773, "args": { "External id": 22108,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752577.757, "dur": 1.285, "args": { "External id": 22109,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752593.824, "dur": 1.361, "args": { "External id": 22110,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752605.469, "dur": 1.331, "args": { "External id": 22111,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752617.402, "dur": 0.985, "args": { "External id": 22112,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752627.875, "dur": 0.841, "args": { "External id": 22113,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752639.257, "dur": 0.931, "args": { "External id": 22114,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752650.423, "dur": 0.921, "args": { "External id": 22115,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752663.236, "dur": 0.986, "args": { "External id": 22116,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4707 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651752757.987, "dur": 2818.509, "args": { "External id": 22117,"Record function id": 0, "Ev Idx": 4708 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651752778.199, "dur": 1052.022, "args": { "External id": 22118,"Record function id": 0, "Ev Idx": 4709 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651752792.470, "dur": 367.177, "args": { "External id": 22119,"Record function id": 0, "Ev Idx": 4710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752875.729, "dur": 4.459, "args": { "External id": 22120,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752883.174, "dur": 1.007, "args": { "External id": 22121,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752885.870, "dur": 1.429, "args": { "External id": 22122,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752888.821, "dur": 0.858, "args": { "External id": 22123,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752893.044, "dur": 1.273, "args": { "External id": 22124,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752895.656, "dur": 0.835, "args": { "External id": 22125,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752898.045, "dur": 0.705, "args": { "External id": 22126,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752900.123, "dur": 1.297, "args": { "External id": 22127,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752905.500, "dur": 0.962, "args": { "External id": 22128,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651752907.638, "dur": 1.435, "args": { "External id": 22129,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4720 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651752925.929, "dur": 199.126, "args": { "External id": 22130,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651752942.276, "dur": 174.068, "args": { "External id": 22131,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651752956.974, "dur": 12.202, "args": { "External id": 22132,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651752972.284, "dur": 115.985, "args": { "External id": 22133,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651752974.825, "dur": 113.044, "args": { "External id": 22134,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651752980.455, "dur": 45.267, "args": { "External id": 22135,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651753028.337, "dur": 58.972, "args": { "External id": 22136,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.5", "pid": 1336754, "tid": 1381179, "ts": 1295651753272.139, "dur": 550.731, "args": { "External id": 22137,"Record function id": 0, "Ev Idx": 4728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651753290.300, "dur": 520.802, "args": { "External id": 22138,"Record function id": 0, "Ev Idx": 4729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651753356.968, "dur": 6.239, "args": { "External id": 22139,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651753379.882, "dur": 24.016, "args": { "External id": 22140,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753384.639, "dur": 1.853, "args": { "External id": 22141,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753388.116, "dur": 0.308, "args": { "External id": 22142,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753389.852, "dur": 0.418, "args": { "External id": 22143,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753391.471, "dur": 0.310, "args": { "External id": 22144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753394.042, "dur": 0.398, "args": { "External id": 22145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753395.566, "dur": 0.356, "args": { "External id": 22146,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753396.679, "dur": 0.229, "args": { "External id": 22147,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753398.722, "dur": 0.736, "args": { "External id": 22148,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753400.214, "dur": 0.378, "args": { "External id": 22149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651753414.303, "dur": 31.646, "args": { "External id": 22150,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651753476.585, "dur": 105.938, "args": { "External id": 22151,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651753489.646, "dur": 3.206, "args": { "External id": 22152,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651753497.751, "dur": 10.036, "args": { "External id": 22153,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651753501.806, "dur": 5.575, "args": { "External id": 22154,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753505.312, "dur": 0.820, "args": { "External id": 22155,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651753514.258, "dur": 21.517, "args": { "External id": 22156,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753515.985, "dur": 0.440, "args": { "External id": 22157,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753517.782, "dur": 0.883, "args": { "External id": 22158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753521.894, "dur": 0.403, "args": { "External id": 22159,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753523.071, "dur": 0.192, "args": { "External id": 22160,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753524.330, "dur": 0.964, "args": { "External id": 22161,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753526.503, "dur": 0.464, "args": { "External id": 22162,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753527.733, "dur": 0.172, "args": { "External id": 22163,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753528.716, "dur": 1.040, "args": { "External id": 22164,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651753531.026, "dur": 0.350, "args": { "External id": 22165,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651753552.659, "dur": 16.848, "args": { "External id": 22166,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4757 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651753625.567, "dur": 112.766, "args": { "External id": 22167,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4758 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651753651.431, "dur": 83.719, "args": { "External id": 22168,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4759, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651753660.164, "dur": 71.064, "args": { "External id": 22169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4760 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651753757.850, "dur": 1.929, "args": { "External id": 22170,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4761, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651753839.740, "dur": 1713.948, "args": { "External id": 22171,"Sequence number": 246554, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4762 } }, { "ph": "f", "id": 214, "pid": 1336754, "tid": 1381179, "ts": 1295651753839.740, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651753952.156, "dur": 153.446, "args": { "External id": 22172,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4763 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651754152.730, "dur": 41.905, "args": { "External id": 22173,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651754212.318, "dur": 69.915, "args": { "External id": 22174,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754294.990, "dur": 34.875, "args": { "External id": 22175,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754337.221, "dur": 46.267, "args": { "External id": 22176,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754391.578, "dur": 27.635, "args": { "External id": 22177,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754427.366, "dur": 43.157, "args": { "External id": 22178,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4769 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651754498.703, "dur": 24.308, "args": { "External id": 22179,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4770 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651754541.144, "dur": 28.387, "args": { "External id": 22180,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4771 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651754593.267, "dur": 19.916, "args": { "External id": 22181,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651754628.331, "dur": 14.524, "args": { "External id": 22182,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754652.147, "dur": 30.000, "args": { "External id": 22183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651754685.354, "dur": 36.748, "args": { "External id": 22184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4775 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651754755.123, "dur": 172.412, "args": { "External id": 22185,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651754837.939, "dur": 5.416, "args": { "External id": 22186,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651754845.436, "dur": 2.390, "args": { "External id": 22187,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4778 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651754961.199, "dur": 64.881, "args": { "External id": 22188,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4779 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651755041.609, "dur": 15.420, "args": { "External id": 22189,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755067.233, "dur": 41.927, "args": { "External id": 22190,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755115.072, "dur": 35.912, "args": { "External id": 22191,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755157.226, "dur": 20.715, "args": { "External id": 22192,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755182.197, "dur": 29.385, "args": { "External id": 22193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755217.483, "dur": 47.167, "args": { "External id": 22194,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651755283.592, "dur": 43.789, "args": { "External id": 22195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4786 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651755351.018, "dur": 27.486, "args": { "External id": 22196,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4787 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651755398.288, "dur": 25.942, "args": { "External id": 22197,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4788 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651755442.720, "dur": 16.708, "args": { "External id": 22198,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4789 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651755475.441, "dur": 16.932, "args": { "External id": 22199,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4790 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651755506.812, "dur": 14.834, "args": { "External id": 22200,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4791 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755598.978, "dur": 18.625, "args": { "External id": 22201,"Record function id": 0, "Ev Idx": 4792 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755605.270, "dur": 11.422, "args": { "External id": 22202,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755609.473, "dur": 6.338, "args": { "External id": 22203,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4794 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755611.054, "dur": 4.649, "args": { "External id": 22204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4795 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755621.642, "dur": 4.252, "args": { "External id": 22205,"Record function id": 0, "Ev Idx": 4796 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755622.950, "dur": 2.491, "args": { "External id": 22206,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755623.564, "dur": 1.405, "args": { "External id": 22207,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4798 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755624.023, "dur": 0.870, "args": { "External id": 22208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4799 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755629.139, "dur": 4.867, "args": { "External id": 22209,"Record function id": 0, "Ev Idx": 4800 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755630.824, "dur": 2.743, "args": { "External id": 22210,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755631.444, "dur": 1.638, "args": { "External id": 22211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4802 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755632.070, "dur": 0.909, "args": { "External id": 22212,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4803 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755637.145, "dur": 4.378, "args": { "External id": 22213,"Record function id": 0, "Ev Idx": 4804 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755638.267, "dur": 2.884, "args": { "External id": 22214,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755638.880, "dur": 1.818, "args": { "External id": 22215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4806 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755639.260, "dur": 1.327, "args": { "External id": 22216,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4807 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755644.557, "dur": 4.676, "args": { "External id": 22217,"Record function id": 0, "Ev Idx": 4808 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755645.981, "dur": 2.817, "args": { "External id": 22218,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755646.511, "dur": 1.874, "args": { "External id": 22219,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4810 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755647.323, "dur": 0.995, "args": { "External id": 22220,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4811 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755652.314, "dur": 4.003, "args": { "External id": 22221,"Record function id": 0, "Ev Idx": 4812 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755653.363, "dur": 2.553, "args": { "External id": 22222,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755654.161, "dur": 1.197, "args": { "External id": 22223,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4814 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755654.817, "dur": 0.476, "args": { "External id": 22224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4815 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755662.578, "dur": 3.418, "args": { "External id": 22225,"Record function id": 0, "Ev Idx": 4816 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755663.567, "dur": 2.031, "args": { "External id": 22226,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755664.191, "dur": 0.968, "args": { "External id": 22227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4818 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755664.643, "dur": 0.451, "args": { "External id": 22228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4819 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755668.997, "dur": 5.522, "args": { "External id": 22229,"Record function id": 0, "Ev Idx": 4820 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755670.311, "dur": 3.810, "args": { "External id": 22230,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755670.956, "dur": 2.706, "args": { "External id": 22231,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4822 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755673.083, "dur": 0.478, "args": { "External id": 22232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4823 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755677.472, "dur": 3.130, "args": { "External id": 22233,"Record function id": 0, "Ev Idx": 4824 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651755678.371, "dur": 1.847, "args": { "External id": 22234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755678.822, "dur": 0.985, "args": { "External id": 22235,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4826 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651755679.255, "dur": 0.490, "args": { "External id": 22236,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4827 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651755684.551, "dur": 35408.624, "args": { "External id": 22237,"Record function id": 0, "Sequence number": 246553, "Fwd thread id": 1, "Ev Idx": 4828 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651755685.854, "dur": 35397.426, "args": { "External id": 22238,"Sequence number": 246553, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4829 } }, { "ph": "f", "id": 215, "pid": 1336754, "tid": 1381179, "ts": 1295651755685.854, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651755715.635, "dur": 44.646, "args": { "External id": 22239,"Record function id": 0, "Ev Idx": 4830 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651755768.004, "dur": 73.753, "args": { "External id": 22240,"Record function id": 0, "Ev Idx": 4831 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.6)", "pid": 1336754, "tid": 1381179, "ts": 1295651755847.330, "dur": 35227.099, "args": { "External id": 22241,"Record function id": 0, "Ev Idx": 4832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651755935.919, "dur": 6.449, "args": { "External id": 22242,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651755951.599, "dur": 4.527, "args": { "External id": 22243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4834 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651755970.903, "dur": 34298.309, "args": { "External id": 22244,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651756023.638, "dur": 34236.037, "args": { "External id": 22245,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651756070.406, "dur": 15.942, "args": { "External id": 22246,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651756092.931, "dur": 34117.340, "args": { "External id": 22247,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651756095.555, "dur": 34114.200, "args": { "External id": 22248,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651756098.926, "dur": 6.149, "args": { "External id": 22249,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651756108.988, "dur": 34097.024, "args": { "External id": 22250,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651790363.343, "dur": 11.099, "args": { "External id": 22251,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651790366.196, "dur": 7.819, "args": { "External id": 22252,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4843 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651790402.840, "dur": 343.093, "args": { "External id": 22253,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4844 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651790434.339, "dur": 306.710, "args": { "External id": 22254,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4845, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651790445.353, "dur": 290.535, "args": { "External id": 22255,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4846 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651790766.291, "dur": 2.318, "args": { "External id": 22256,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4847, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790824.383, "dur": 7.009, "args": { "External id": 22257,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790875.434, "dur": 1.940, "args": { "External id": 22258,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790893.750, "dur": 0.919, "args": { "External id": 22259,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790906.055, "dur": 0.907, "args": { "External id": 22260,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790918.481, "dur": 0.959, "args": { "External id": 22261,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790929.500, "dur": 0.836, "args": { "External id": 22262,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790940.265, "dur": 1.146, "args": { "External id": 22263,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790955.104, "dur": 0.916, "args": { "External id": 22264,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651790965.170, "dur": 1.200, "args": { "External id": 22265,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4856 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651791109.503, "dur": 2725.055, "args": { "External id": 22266,"Record function id": 0, "Ev Idx": 4857 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651791129.133, "dur": 1029.461, "args": { "External id": 22267,"Record function id": 0, "Ev Idx": 4858 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651791144.327, "dur": 344.656, "args": { "External id": 22268,"Record function id": 0, "Ev Idx": 4859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791248.892, "dur": 4.785, "args": { "External id": 22269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791257.779, "dur": 1.449, "args": { "External id": 22270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791261.239, "dur": 1.052, "args": { "External id": 22271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791265.749, "dur": 1.200, "args": { "External id": 22272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791268.118, "dur": 1.140, "args": { "External id": 22273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791270.619, "dur": 1.032, "args": { "External id": 22274,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 4865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791273.183, "dur": 1.114, "args": { "External id": 22275,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 4866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791277.446, "dur": 1.051, "args": { "External id": 22276,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791279.764, "dur": 0.845, "args": { "External id": 22277,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651791282.030, "dur": 1.055, "args": { "External id": 22278,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 4869 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651791302.013, "dur": 156.038, "args": { "External id": 22279,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651791320.104, "dur": 133.190, "args": { "External id": 22280,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 4871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651791335.744, "dur": 13.894, "args": { "External id": 22281,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651791352.785, "dur": 69.931, "args": { "External id": 22282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 4873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651791355.358, "dur": 67.058, "args": { "External id": 22283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 4874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791359.298, "dur": 5.997, "args": { "External id": 22284,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651791366.901, "dur": 54.662, "args": { "External id": 22285,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 4876 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.4", "pid": 1336754, "tid": 1381179, "ts": 1295651791583.980, "dur": 566.682, "args": { "External id": 22286,"Record function id": 0, "Ev Idx": 4877 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651791601.662, "dur": 537.020, "args": { "External id": 22287,"Record function id": 0, "Ev Idx": 4878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651791663.193, "dur": 4.796, "args": { "External id": 22288,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651791683.556, "dur": 21.247, "args": { "External id": 22289,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791687.960, "dur": 1.590, "args": { "External id": 22290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791690.804, "dur": 0.472, "args": { "External id": 22291,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791692.172, "dur": 0.513, "args": { "External id": 22292,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791693.914, "dur": 0.207, "args": { "External id": 22293,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791695.448, "dur": 0.823, "args": { "External id": 22294,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791697.470, "dur": 0.585, "args": { "External id": 22295,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791698.981, "dur": 0.547, "args": { "External id": 22296,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791700.200, "dur": 0.704, "args": { "External id": 22297,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791702.053, "dur": 0.342, "args": { "External id": 22298,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651791714.553, "dur": 29.271, "args": { "External id": 22299,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4890 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651791774.432, "dur": 87.540, "args": { "External id": 22300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 4891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651791783.099, "dur": 2.751, "args": { "External id": 22301,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651791790.872, "dur": 10.018, "args": { "External id": 22302,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651791794.732, "dur": 5.734, "args": { "External id": 22303,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 4894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791798.168, "dur": 0.859, "args": { "External id": 22304,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 4895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651791807.145, "dur": 19.963, "args": { "External id": 22305,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 4896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791808.897, "dur": 0.521, "args": { "External id": 22306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791810.820, "dur": 0.445, "args": { "External id": 22307,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791812.669, "dur": 0.977, "args": { "External id": 22308,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791814.998, "dur": 0.254, "args": { "External id": 22309,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791815.852, "dur": 0.477, "args": { "External id": 22310,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791817.437, "dur": 0.672, "args": { "External id": 22311,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791819.389, "dur": 0.546, "args": { "External id": 22312,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791820.544, "dur": 0.333, "args": { "External id": 22313,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651791821.801, "dur": 0.726, "args": { "External id": 22314,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651791836.255, "dur": 18.549, "args": { "External id": 22315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 4906 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651791903.209, "dur": 158.178, "args": { "External id": 22316,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 4907 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651791930.771, "dur": 126.445, "args": { "External id": 22317,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4908, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651791939.238, "dur": 113.153, "args": { "External id": 22318,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 4909 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651792080.474, "dur": 1.880, "args": { "External id": 22319,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4910, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651792166.374, "dur": 1645.903, "args": { "External id": 22320,"Sequence number": 246552, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4911 } }, { "ph": "f", "id": 216, "pid": 1336754, "tid": 1381179, "ts": 1295651792166.374, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792306.735, "dur": 109.528, "args": { "External id": 22321,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 4912 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651792458.293, "dur": 39.969, "args": { "External id": 22322,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 4913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651792514.864, "dur": 51.250, "args": { "External id": 22323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 4914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792575.984, "dur": 34.939, "args": { "External id": 22324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792617.218, "dur": 45.069, "args": { "External id": 22325,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792669.812, "dur": 28.057, "args": { "External id": 22326,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 4917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792707.161, "dur": 42.636, "args": { "External id": 22327,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 4918 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651792774.102, "dur": 20.328, "args": { "External id": 22328,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 4919 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651792814.138, "dur": 29.098, "args": { "External id": 22329,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4920 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651792864.641, "dur": 17.686, "args": { "External id": 22330,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4921 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651792897.915, "dur": 15.328, "args": { "External id": 22331,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792922.141, "dur": 26.762, "args": { "External id": 22332,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651792951.937, "dur": 67.799, "args": { "External id": 22333,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4924 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651793050.416, "dur": 168.517, "args": { "External id": 22334,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 4925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651793127.594, "dur": 6.005, "args": { "External id": 22335,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651793135.582, "dur": 2.193, "args": { "External id": 22336,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4927 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651793277.640, "dur": 27.447, "args": { "External id": 22337,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4928 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651793321.875, "dur": 14.182, "args": { "External id": 22338,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793345.172, "dur": 42.020, "args": { "External id": 22339,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793392.678, "dur": 36.448, "args": { "External id": 22340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793435.870, "dur": 19.978, "args": { "External id": 22341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793460.837, "dur": 29.642, "args": { "External id": 22342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793496.227, "dur": 34.564, "args": { "External id": 22343,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 4934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651793550.074, "dur": 38.846, "args": { "External id": 22344,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 4935 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651793611.386, "dur": 26.981, "args": { "External id": 22345,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 4936 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651793657.078, "dur": 29.420, "args": { "External id": 22346,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 4937 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651793702.565, "dur": 16.033, "args": { "External id": 22347,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 4938 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651793735.240, "dur": 16.529, "args": { "External id": 22348,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 4939 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651793764.710, "dur": 15.573, "args": { "External id": 22349,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 4940 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793856.992, "dur": 17.878, "args": { "External id": 22350,"Record function id": 0, "Ev Idx": 4941 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793863.317, "dur": 10.583, "args": { "External id": 22351,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793867.220, "dur": 5.839, "args": { "External id": 22352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4943 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793868.580, "dur": 4.384, "args": { "External id": 22353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4944 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793878.787, "dur": 4.703, "args": { "External id": 22354,"Record function id": 0, "Ev Idx": 4945 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793880.238, "dur": 2.856, "args": { "External id": 22355,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793881.217, "dur": 1.377, "args": { "External id": 22356,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4947 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793881.844, "dur": 0.675, "args": { "External id": 22357,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4948 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793886.712, "dur": 4.999, "args": { "External id": 22358,"Record function id": 0, "Ev Idx": 4949 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793887.900, "dur": 3.377, "args": { "External id": 22359,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793888.959, "dur": 1.866, "args": { "External id": 22360,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4951 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793889.530, "dur": 1.172, "args": { "External id": 22361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 4952 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793894.956, "dur": 4.423, "args": { "External id": 22362,"Record function id": 0, "Ev Idx": 4953 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793896.220, "dur": 2.783, "args": { "External id": 22363,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793897.503, "dur": 1.069, "args": { "External id": 22364,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4955 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793897.914, "dur": 0.567, "args": { "External id": 22365,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 4956 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793902.513, "dur": 3.552, "args": { "External id": 22366,"Record function id": 0, "Ev Idx": 4957 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793903.530, "dur": 2.115, "args": { "External id": 22367,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793904.016, "dur": 1.165, "args": { "External id": 22368,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4959 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793904.376, "dur": 0.740, "args": { "External id": 22369,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4960 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793909.131, "dur": 3.274, "args": { "External id": 22370,"Record function id": 0, "Ev Idx": 4961 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793910.040, "dur": 1.953, "args": { "External id": 22371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793910.475, "dur": 1.063, "args": { "External id": 22372,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4963 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793910.920, "dur": 0.553, "args": { "External id": 22373,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4964 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793915.611, "dur": 7.466, "args": { "External id": 22374,"Record function id": 0, "Ev Idx": 4965 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793920.616, "dur": 2.051, "args": { "External id": 22375,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793921.072, "dur": 1.146, "args": { "External id": 22376,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4967 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793921.356, "dur": 0.783, "args": { "External id": 22377,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4968 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793926.160, "dur": 3.171, "args": { "External id": 22378,"Record function id": 0, "Ev Idx": 4969 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793927.014, "dur": 1.927, "args": { "External id": 22379,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793927.488, "dur": 0.989, "args": { "External id": 22380,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4971 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793927.769, "dur": 0.641, "args": { "External id": 22381,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 4972 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793932.371, "dur": 5.420, "args": { "External id": 22382,"Record function id": 0, "Ev Idx": 4973 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651793933.204, "dur": 4.208, "args": { "External id": 22383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793933.689, "dur": 3.154, "args": { "External id": 22384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4975 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651793935.896, "dur": 0.767, "args": { "External id": 22385,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 4976 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651793941.470, "dur": 37850.431, "args": { "External id": 22386,"Record function id": 0, "Sequence number": 246551, "Fwd thread id": 1, "Ev Idx": 4977 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651793942.814, "dur": 37839.750, "args": { "External id": 22387,"Sequence number": 246551, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 4978 } }, { "ph": "f", "id": 217, "pid": 1336754, "tid": 1381179, "ts": 1295651793942.814, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651793970.603, "dur": 85.053, "args": { "External id": 22388,"Record function id": 0, "Ev Idx": 4979 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651794065.573, "dur": 71.553, "args": { "External id": 22389,"Record function id": 0, "Ev Idx": 4980 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.5)", "pid": 1336754, "tid": 1381179, "ts": 1295651794143.168, "dur": 37631.593, "args": { "External id": 22390,"Record function id": 0, "Ev Idx": 4981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651794254.999, "dur": 7.932, "args": { "External id": 22391,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651794277.061, "dur": 5.319, "args": { "External id": 22392,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 4983 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651794297.980, "dur": 36581.093, "args": { "External id": 22393,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651794311.409, "dur": 36557.838, "args": { "External id": 22394,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 4985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651794356.123, "dur": 18.044, "args": { "External id": 22395,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651794380.384, "dur": 36446.418, "args": { "External id": 22396,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 4987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651794388.662, "dur": 36437.392, "args": { "External id": 22397,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 4988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651794392.487, "dur": 5.948, "args": { "External id": 22398,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651794400.193, "dur": 36421.308, "args": { "External id": 22399,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 4990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651831036.662, "dur": 12.420, "args": { "External id": 22400,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 4991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651831039.716, "dur": 8.798, "args": { "External id": 22401,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 4992 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651831079.559, "dur": 401.092, "args": { "External id": 22402,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 4993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651831110.534, "dur": 364.965, "args": { "External id": 22403,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 4994, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651831122.771, "dur": 347.015, "args": { "External id": 22404,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 4995 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651831504.935, "dur": 2.463, "args": { "External id": 22405,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 4996, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831570.197, "dur": 7.153, "args": { "External id": 22406,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831625.239, "dur": 1.358, "args": { "External id": 22407,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831644.550, "dur": 1.181, "args": { "External id": 22408,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 4999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831658.001, "dur": 0.896, "args": { "External id": 22409,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831671.272, "dur": 0.786, "args": { "External id": 22410,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831682.122, "dur": 1.070, "args": { "External id": 22411,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831693.823, "dur": 0.816, "args": { "External id": 22412,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831705.046, "dur": 0.887, "args": { "External id": 22413,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651831715.154, "dur": 1.397, "args": { "External id": 22414,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5005 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651831805.723, "dur": 2741.841, "args": { "External id": 22415,"Record function id": 0, "Ev Idx": 5006 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651831825.073, "dur": 1017.860, "args": { "External id": 22416,"Record function id": 0, "Ev Idx": 5007 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651831838.507, "dur": 355.790, "args": { "External id": 22417,"Record function id": 0, "Ev Idx": 5008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831918.768, "dur": 4.489, "args": { "External id": 22418,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831928.686, "dur": 1.566, "args": { "External id": 22419,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831932.279, "dur": 1.009, "args": { "External id": 22420,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831934.872, "dur": 1.090, "args": { "External id": 22421,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831937.240, "dur": 1.432, "args": { "External id": 22422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831941.805, "dur": 1.007, "args": { "External id": 22423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831944.866, "dur": 1.160, "args": { "External id": 22424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831947.273, "dur": 1.181, "args": { "External id": 22425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831949.901, "dur": 0.804, "args": { "External id": 22426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651831954.139, "dur": 0.960, "args": { "External id": 22427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5018 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651831973.122, "dur": 189.900, "args": { "External id": 22428,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651832029.366, "dur": 129.075, "args": { "External id": 22429,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651832045.599, "dur": 13.061, "args": { "External id": 22430,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651832062.132, "dur": 68.585, "args": { "External id": 22431,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651832064.645, "dur": 65.750, "args": { "External id": 22432,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832068.854, "dur": 5.373, "args": { "External id": 22433,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651832075.852, "dur": 54.014, "args": { "External id": 22434,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5025 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.3", "pid": 1336754, "tid": 1381179, "ts": 1295651832312.078, "dur": 523.879, "args": { "External id": 22435,"Record function id": 0, "Ev Idx": 5026 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651832330.028, "dur": 494.056, "args": { "External id": 22436,"Record function id": 0, "Ev Idx": 5027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651832396.574, "dur": 5.962, "args": { "External id": 22437,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651832419.233, "dur": 23.582, "args": { "External id": 22438,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832423.951, "dur": 1.834, "args": { "External id": 22439,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832427.533, "dur": 0.795, "args": { "External id": 22440,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832429.774, "dur": 0.418, "args": { "External id": 22441,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832430.964, "dur": 0.301, "args": { "External id": 22442,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832432.034, "dur": 0.664, "args": { "External id": 22443,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832433.950, "dur": 0.435, "args": { "External id": 22444,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832435.100, "dur": 0.469, "args": { "External id": 22445,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832436.464, "dur": 0.601, "args": { "External id": 22446,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832439.148, "dur": 0.471, "args": { "External id": 22447,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651832453.448, "dur": 33.073, "args": { "External id": 22448,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5039 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651832517.718, "dur": 83.104, "args": { "External id": 22449,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651832527.786, "dur": 3.178, "args": { "External id": 22450,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651832535.539, "dur": 9.203, "args": { "External id": 22451,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651832539.507, "dur": 4.798, "args": { "External id": 22452,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832542.581, "dur": 0.530, "args": { "External id": 22453,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651832551.334, "dur": 15.935, "args": { "External id": 22454,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832553.203, "dur": 0.546, "args": { "External id": 22455,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832554.851, "dur": 0.363, "args": { "External id": 22456,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832555.889, "dur": 0.365, "args": { "External id": 22457,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832556.855, "dur": 0.434, "args": { "External id": 22458,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832558.883, "dur": 0.566, "args": { "External id": 22459,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832560.250, "dur": 0.338, "args": { "External id": 22460,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832561.114, "dur": 0.184, "args": { "External id": 22461,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832561.871, "dur": 0.620, "args": { "External id": 22462,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651832563.441, "dur": 0.328, "args": { "External id": 22463,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651832576.580, "dur": 17.179, "args": { "External id": 22464,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5055 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651832643.477, "dur": 113.901, "args": { "External id": 22465,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5056 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651832671.133, "dur": 83.019, "args": { "External id": 22466,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5057, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651832680.415, "dur": 69.838, "args": { "External id": 22467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5058 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651832773.341, "dur": 1.727, "args": { "External id": 22468,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5059, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651832849.818, "dur": 1673.433, "args": { "External id": 22469,"Sequence number": 246550, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5060 } }, { "ph": "f", "id": 218, "pid": 1336754, "tid": 1381179, "ts": 1295651832849.818, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651832960.703, "dur": 147.471, "args": { "External id": 22470,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651833152.676, "dur": 42.113, "args": { "External id": 22471,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651833212.839, "dur": 78.908, "args": { "External id": 22472,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833304.145, "dur": 37.394, "args": { "External id": 22473,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833347.775, "dur": 47.999, "args": { "External id": 22474,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833402.866, "dur": 28.314, "args": { "External id": 22475,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833439.085, "dur": 41.824, "args": { "External id": 22476,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5067 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651833504.935, "dur": 24.870, "args": { "External id": 22477,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5068 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651833550.490, "dur": 31.023, "args": { "External id": 22478,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5069 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651833603.271, "dur": 21.636, "args": { "External id": 22479,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5070 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651833640.292, "dur": 13.714, "args": { "External id": 22480,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833662.032, "dur": 27.622, "args": { "External id": 22481,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651833692.714, "dur": 34.948, "args": { "External id": 22482,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5073 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651833753.705, "dur": 171.720, "args": { "External id": 22483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651833837.135, "dur": 6.184, "args": { "External id": 22484,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651833845.076, "dur": 2.106, "args": { "External id": 22485,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5076 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651833957.119, "dur": 23.198, "args": { "External id": 22486,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5077 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651834032.041, "dur": 17.562, "args": { "External id": 22487,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834060.414, "dur": 40.530, "args": { "External id": 22488,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834107.090, "dur": 35.056, "args": { "External id": 22489,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834148.973, "dur": 21.026, "args": { "External id": 22490,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834174.806, "dur": 30.919, "args": { "External id": 22491,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834211.582, "dur": 36.019, "args": { "External id": 22492,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651834257.257, "dur": 33.047, "args": { "External id": 22493,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5084 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651834310.060, "dur": 36.816, "args": { "External id": 22494,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5085 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651834371.443, "dur": 23.888, "args": { "External id": 22495,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651834415.939, "dur": 20.232, "args": { "External id": 22496,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5087 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651834451.586, "dur": 13.917, "args": { "External id": 22497,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651834478.804, "dur": 17.778, "args": { "External id": 22498,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5089 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834569.657, "dur": 14.865, "args": { "External id": 22499,"Record function id": 0, "Ev Idx": 5090 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834572.973, "dur": 10.574, "args": { "External id": 22500,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834576.890, "dur": 5.659, "args": { "External id": 22501,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5092 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834578.270, "dur": 4.173, "args": { "External id": 22502,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5093 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834588.464, "dur": 4.755, "args": { "External id": 22503,"Record function id": 0, "Ev Idx": 5094 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834589.911, "dur": 2.863, "args": { "External id": 22504,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834590.646, "dur": 1.648, "args": { "External id": 22505,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5096 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834591.320, "dur": 0.900, "args": { "External id": 22506,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5097 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834599.545, "dur": 3.801, "args": { "External id": 22507,"Record function id": 0, "Ev Idx": 5098 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834600.622, "dur": 2.293, "args": { "External id": 22508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834601.195, "dur": 1.230, "args": { "External id": 22509,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5100 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834601.704, "dur": 0.645, "args": { "External id": 22510,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5101 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834606.651, "dur": 4.223, "args": { "External id": 22511,"Record function id": 0, "Ev Idx": 5102 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834608.053, "dur": 2.384, "args": { "External id": 22512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834608.532, "dur": 1.469, "args": { "External id": 22513,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5104 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834608.818, "dur": 1.116, "args": { "External id": 22514,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5105 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834613.984, "dur": 3.661, "args": { "External id": 22515,"Record function id": 0, "Ev Idx": 5106 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834615.175, "dur": 2.044, "args": { "External id": 22516,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834615.659, "dur": 1.121, "args": { "External id": 22517,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5108 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834616.124, "dur": 0.582, "args": { "External id": 22518,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5109 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834620.728, "dur": 5.870, "args": { "External id": 22519,"Record function id": 0, "Ev Idx": 5110 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834621.943, "dur": 4.236, "args": { "External id": 22520,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834622.609, "dur": 3.127, "args": { "External id": 22521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5112 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834625.096, "dur": 0.578, "args": { "External id": 22522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5113 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834629.796, "dur": 3.460, "args": { "External id": 22523,"Record function id": 0, "Ev Idx": 5114 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834630.914, "dur": 1.900, "args": { "External id": 22524,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834631.404, "dur": 0.960, "args": { "External id": 22525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5116 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834631.697, "dur": 0.594, "args": { "External id": 22526,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5117 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834636.349, "dur": 26.280, "args": { "External id": 22527,"Record function id": 0, "Ev Idx": 5118 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834637.223, "dur": 24.969, "args": { "External id": 22528,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834660.372, "dur": 1.182, "args": { "External id": 22529,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5120 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834660.813, "dur": 0.676, "args": { "External id": 22530,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5121 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834665.886, "dur": 5.820, "args": { "External id": 22531,"Record function id": 0, "Ev Idx": 5122 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651834667.127, "dur": 4.141, "args": { "External id": 22532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834667.628, "dur": 3.177, "args": { "External id": 22533,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5124 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651834670.145, "dur": 0.546, "args": { "External id": 22534,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5125 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651834675.384, "dur": 35510.599, "args": { "External id": 22535,"Record function id": 0, "Sequence number": 246549, "Fwd thread id": 1, "Ev Idx": 5126 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651834676.801, "dur": 35499.600, "args": { "External id": 22536,"Sequence number": 246549, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5127 } }, { "ph": "f", "id": 219, "pid": 1336754, "tid": 1381179, "ts": 1295651834676.801, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651834706.178, "dur": 40.370, "args": { "External id": 22537,"Record function id": 0, "Ev Idx": 5128 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651834753.788, "dur": 68.192, "args": { "External id": 22538,"Record function id": 0, "Ev Idx": 5129 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.4)", "pid": 1336754, "tid": 1381179, "ts": 1295651834828.103, "dur": 35340.398, "args": { "External id": 22539,"Record function id": 0, "Ev Idx": 5130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651834917.586, "dur": 6.549, "args": { "External id": 22540,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651834933.801, "dur": 4.389, "args": { "External id": 22541,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651834952.589, "dur": 34413.726, "args": { "External id": 22542,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651834969.763, "dur": 34387.595, "args": { "External id": 22543,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651835055.465, "dur": 16.143, "args": { "External id": 22544,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651835078.144, "dur": 34238.644, "args": { "External id": 22545,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651835080.629, "dur": 34235.494, "args": { "External id": 22546,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651835084.093, "dur": 6.773, "args": { "External id": 22547,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651835094.739, "dur": 34217.905, "args": { "External id": 22548,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651869457.981, "dur": 9.364, "args": { "External id": 22549,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651869460.663, "dur": 6.302, "args": { "External id": 22550,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5141 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651869495.499, "dur": 339.149, "args": { "External id": 22551,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5142 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651869523.368, "dur": 306.862, "args": { "External id": 22552,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5143, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651869534.583, "dur": 290.485, "args": { "External id": 22553,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5144 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651869852.619, "dur": 2.273, "args": { "External id": 22554,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5145, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651869906.594, "dur": 6.577, "args": { "External id": 22555,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651869958.681, "dur": 1.561, "args": { "External id": 22556,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651869976.421, "dur": 1.464, "args": { "External id": 22557,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870043.314, "dur": 1.593, "args": { "External id": 22558,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870056.479, "dur": 1.071, "args": { "External id": 22559,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870068.218, "dur": 1.013, "args": { "External id": 22560,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870079.797, "dur": 1.289, "args": { "External id": 22561,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870091.770, "dur": 1.360, "args": { "External id": 22562,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870106.194, "dur": 1.281, "args": { "External id": 22563,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5154 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651870201.204, "dur": 2697.893, "args": { "External id": 22564,"Record function id": 0, "Ev Idx": 5155 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651870221.304, "dur": 1030.425, "args": { "External id": 22565,"Record function id": 0, "Ev Idx": 5156 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651870252.607, "dur": 318.627, "args": { "External id": 22566,"Record function id": 0, "Ev Idx": 5157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870339.440, "dur": 4.824, "args": { "External id": 22567,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870347.587, "dur": 1.320, "args": { "External id": 22568,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870350.425, "dur": 1.307, "args": { "External id": 22569,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870355.243, "dur": 1.125, "args": { "External id": 22570,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870357.742, "dur": 1.209, "args": { "External id": 22571,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870360.188, "dur": 1.275, "args": { "External id": 22572,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870362.971, "dur": 1.055, "args": { "External id": 22573,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870367.112, "dur": 0.795, "args": { "External id": 22574,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870369.240, "dur": 1.477, "args": { "External id": 22575,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651870372.267, "dur": 0.909, "args": { "External id": 22576,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5167 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651870390.660, "dur": 153.018, "args": { "External id": 22577,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651870406.758, "dur": 132.386, "args": { "External id": 22578,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651870423.950, "dur": 13.088, "args": { "External id": 22579,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651870440.319, "dur": 71.828, "args": { "External id": 22580,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651870443.133, "dur": 68.643, "args": { "External id": 22581,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870447.365, "dur": 5.952, "args": { "External id": 22582,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651870457.143, "dur": 53.984, "args": { "External id": 22583,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5174 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.2", "pid": 1336754, "tid": 1381179, "ts": 1295651870664.670, "dur": 560.885, "args": { "External id": 22584,"Record function id": 0, "Ev Idx": 5175 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651870680.150, "dur": 533.382, "args": { "External id": 22585,"Record function id": 0, "Ev Idx": 5176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651870746.723, "dur": 4.551, "args": { "External id": 22586,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651870766.787, "dur": 21.418, "args": { "External id": 22587,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870771.611, "dur": 1.459, "args": { "External id": 22588,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870774.552, "dur": 0.568, "args": { "External id": 22589,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870776.485, "dur": 0.756, "args": { "External id": 22590,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870778.102, "dur": 0.200, "args": { "External id": 22591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870780.113, "dur": 0.573, "args": { "External id": 22592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870781.401, "dur": 0.209, "args": { "External id": 22593,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870782.687, "dur": 0.183, "args": { "External id": 22594,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870783.386, "dur": 0.831, "args": { "External id": 22595,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870785.400, "dur": 0.331, "args": { "External id": 22596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651870797.268, "dur": 30.450, "args": { "External id": 22597,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651870857.302, "dur": 88.666, "args": { "External id": 22598,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651870866.623, "dur": 3.458, "args": { "External id": 22599,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651870875.112, "dur": 9.946, "args": { "External id": 22600,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651870879.670, "dur": 4.960, "args": { "External id": 22601,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870882.818, "dur": 0.544, "args": { "External id": 22602,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651870891.568, "dur": 20.109, "args": { "External id": 22603,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870893.124, "dur": 1.194, "args": { "External id": 22604,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870896.164, "dur": 0.387, "args": { "External id": 22605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870898.017, "dur": 0.401, "args": { "External id": 22606,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870899.156, "dur": 0.343, "args": { "External id": 22607,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870900.732, "dur": 0.765, "args": { "External id": 22608,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870902.560, "dur": 0.174, "args": { "External id": 22609,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870903.277, "dur": 0.465, "args": { "External id": 22610,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870904.378, "dur": 1.173, "args": { "External id": 22611,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651870906.720, "dur": 0.582, "args": { "External id": 22612,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651870920.671, "dur": 18.362, "args": { "External id": 22613,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5204 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651871028.633, "dur": 116.051, "args": { "External id": 22614,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5205 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651871054.675, "dur": 86.728, "args": { "External id": 22615,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5206, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651871064.661, "dur": 72.930, "args": { "External id": 22616,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5207 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651871161.400, "dur": 2.186, "args": { "External id": 22617,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5208, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651871260.768, "dur": 1615.933, "args": { "External id": 22618,"Sequence number": 246548, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5209 } }, { "ph": "f", "id": 220, "pid": 1336754, "tid": 1381179, "ts": 1295651871260.768, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651871371.853, "dur": 112.524, "args": { "External id": 22619,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5210 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651871525.234, "dur": 41.979, "args": { "External id": 22620,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651871584.108, "dur": 48.723, "args": { "External id": 22621,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651871641.833, "dur": 33.720, "args": { "External id": 22622,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651871682.657, "dur": 45.458, "args": { "External id": 22623,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651871735.466, "dur": 29.334, "args": { "External id": 22624,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651871773.327, "dur": 42.988, "args": { "External id": 22625,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5216 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651871841.958, "dur": 24.222, "args": { "External id": 22626,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5217 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651871886.644, "dur": 29.387, "args": { "External id": 22627,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5218 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651871936.377, "dur": 21.104, "args": { "External id": 22628,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651871972.057, "dur": 59.347, "args": { "External id": 22629,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872043.856, "dur": 38.837, "args": { "External id": 22630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872086.430, "dur": 34.378, "args": { "External id": 22631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5222 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651872151.460, "dur": 189.042, "args": { "External id": 22632,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651872246.959, "dur": 7.380, "args": { "External id": 22633,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651872256.511, "dur": 2.311, "args": { "External id": 22634,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5225 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651872375.226, "dur": 25.774, "args": { "External id": 22635,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5226 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651872412.748, "dur": 13.526, "args": { "External id": 22636,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872434.170, "dur": 39.588, "args": { "External id": 22637,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872479.715, "dur": 34.471, "args": { "External id": 22638,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872521.087, "dur": 20.870, "args": { "External id": 22639,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872546.649, "dur": 29.594, "args": { "External id": 22640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872582.226, "dur": 33.424, "args": { "External id": 22641,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651872628.723, "dur": 39.212, "args": { "External id": 22642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5233 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651872689.536, "dur": 25.086, "args": { "External id": 22643,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5234 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651872734.221, "dur": 26.391, "args": { "External id": 22644,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5235 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651872776.523, "dur": 16.680, "args": { "External id": 22645,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5236 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651872807.898, "dur": 13.478, "args": { "External id": 22646,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5237 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651872835.818, "dur": 13.753, "args": { "External id": 22647,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5238 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872921.140, "dur": 15.322, "args": { "External id": 22648,"Record function id": 0, "Ev Idx": 5239 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872924.213, "dur": 11.457, "args": { "External id": 22649,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872928.492, "dur": 6.262, "args": { "External id": 22650,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5241 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872930.178, "dur": 4.469, "args": { "External id": 22651,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5242 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872940.185, "dur": 5.297, "args": { "External id": 22652,"Record function id": 0, "Ev Idx": 5243 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872942.001, "dur": 3.027, "args": { "External id": 22653,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872943.078, "dur": 1.383, "args": { "External id": 22654,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5245 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872943.589, "dur": 0.778, "args": { "External id": 22655,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5246 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872948.831, "dur": 5.057, "args": { "External id": 22656,"Record function id": 0, "Ev Idx": 5247 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872950.207, "dur": 3.264, "args": { "External id": 22657,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872951.061, "dur": 1.946, "args": { "External id": 22658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5249 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872952.008, "dur": 0.898, "args": { "External id": 22659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5250 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872957.099, "dur": 3.811, "args": { "External id": 22660,"Record function id": 0, "Ev Idx": 5251 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872958.143, "dur": 2.394, "args": { "External id": 22661,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872958.831, "dur": 1.245, "args": { "External id": 22662,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5253 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872959.300, "dur": 0.669, "args": { "External id": 22663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5254 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872963.975, "dur": 3.887, "args": { "External id": 22664,"Record function id": 0, "Ev Idx": 5255 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872965.268, "dur": 2.189, "args": { "External id": 22665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872965.814, "dur": 1.220, "args": { "External id": 22666,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5257 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872966.200, "dur": 0.772, "args": { "External id": 22667,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5258 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872970.953, "dur": 4.492, "args": { "External id": 22668,"Record function id": 0, "Ev Idx": 5259 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872972.156, "dur": 2.858, "args": { "External id": 22669,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872973.067, "dur": 1.531, "args": { "External id": 22670,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5261 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872973.483, "dur": 1.046, "args": { "External id": 22671,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5262 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872978.627, "dur": 44.944, "args": { "External id": 22672,"Record function id": 0, "Ev Idx": 5263 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651872979.732, "dur": 42.541, "args": { "External id": 22673,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651872980.193, "dur": 40.862, "args": { "External id": 22674,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5265 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651873019.178, "dur": 1.573, "args": { "External id": 22675,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5266 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651873028.939, "dur": 8.016, "args": { "External id": 22676,"Record function id": 0, "Ev Idx": 5267 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651873030.418, "dur": 6.080, "args": { "External id": 22677,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651873034.515, "dur": 1.501, "args": { "External id": 22678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5269 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651873035.046, "dur": 0.904, "args": { "External id": 22679,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5270 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651873040.042, "dur": 9.234, "args": { "External id": 22680,"Record function id": 0, "Ev Idx": 5271 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651873040.949, "dur": 7.914, "args": { "External id": 22681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651873041.485, "dur": 6.778, "args": { "External id": 22682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5273 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651873047.549, "dur": 0.646, "args": { "External id": 22683,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5274 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651873052.897, "dur": 35590.738, "args": { "External id": 22684,"Record function id": 0, "Sequence number": 246547, "Fwd thread id": 1, "Ev Idx": 5275 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651873054.043, "dur": 35580.654, "args": { "External id": 22685,"Sequence number": 246547, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5276 } }, { "ph": "f", "id": 221, "pid": 1336754, "tid": 1381179, "ts": 1295651873054.043, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651873087.017, "dur": 42.953, "args": { "External id": 22686,"Record function id": 0, "Ev Idx": 5277 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651873137.690, "dur": 69.231, "args": { "External id": 22687,"Record function id": 0, "Ev Idx": 5278 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.3)", "pid": 1336754, "tid": 1381179, "ts": 1295651873212.896, "dur": 35414.263, "args": { "External id": 22688,"Record function id": 0, "Ev Idx": 5279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651873324.922, "dur": 7.458, "args": { "External id": 22689,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651873343.199, "dur": 5.121, "args": { "External id": 22690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5281 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651873363.597, "dur": 34444.231, "args": { "External id": 22691,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651873379.100, "dur": 34420.158, "args": { "External id": 22692,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651873420.483, "dur": 17.258, "args": { "External id": 22693,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651873447.157, "dur": 34315.344, "args": { "External id": 22694,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651873449.544, "dur": 34312.357, "args": { "External id": 22695,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651873452.900, "dur": 5.839, "args": { "External id": 22696,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651873460.413, "dur": 34297.897, "args": { "External id": 22697,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651907898.422, "dur": 8.722, "args": { "External id": 22698,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651907901.102, "dur": 5.751, "args": { "External id": 22699,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5290 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651907934.338, "dur": 399.126, "args": { "External id": 22700,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5291 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651907964.923, "dur": 363.553, "args": { "External id": 22701,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5292, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651907975.611, "dur": 346.590, "args": { "External id": 22702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5293 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651908357.263, "dur": 2.387, "args": { "External id": 22703,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5294, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908421.728, "dur": 6.979, "args": { "External id": 22704,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908473.827, "dur": 1.286, "args": { "External id": 22705,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908492.010, "dur": 1.435, "args": { "External id": 22706,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908505.033, "dur": 1.067, "args": { "External id": 22707,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908516.681, "dur": 0.973, "args": { "External id": 22708,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908528.428, "dur": 0.858, "args": { "External id": 22709,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908540.651, "dur": 1.220, "args": { "External id": 22710,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908555.449, "dur": 1.227, "args": { "External id": 22711,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908566.395, "dur": 0.951, "args": { "External id": 22712,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5303 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651908658.110, "dur": 2764.417, "args": { "External id": 22713,"Record function id": 0, "Ev Idx": 5304 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651908678.908, "dur": 1036.183, "args": { "External id": 22714,"Record function id": 0, "Ev Idx": 5305 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651908693.540, "dur": 360.642, "args": { "External id": 22715,"Record function id": 0, "Ev Idx": 5306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908776.705, "dur": 4.480, "args": { "External id": 22716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908784.418, "dur": 1.042, "args": { "External id": 22717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908787.285, "dur": 0.992, "args": { "External id": 22718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908791.792, "dur": 0.976, "args": { "External id": 22719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908794.435, "dur": 0.968, "args": { "External id": 22720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908796.796, "dur": 0.864, "args": { "External id": 22721,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908799.122, "dur": 1.117, "args": { "External id": 22722,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908803.737, "dur": 1.026, "args": { "External id": 22723,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908806.022, "dur": 0.991, "args": { "External id": 22724,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651908808.383, "dur": 1.299, "args": { "External id": 22725,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5316 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651908827.404, "dur": 152.953, "args": { "External id": 22726,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651908842.941, "dur": 132.951, "args": { "External id": 22727,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651908859.939, "dur": 14.264, "args": { "External id": 22728,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651908877.465, "dur": 70.645, "args": { "External id": 22729,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651908880.173, "dur": 67.642, "args": { "External id": 22730,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651908883.623, "dur": 5.393, "args": { "External id": 22731,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651908892.967, "dur": 54.347, "args": { "External id": 22732,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5323 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.1", "pid": 1336754, "tid": 1381179, "ts": 1295651909153.274, "dur": 554.358, "args": { "External id": 22733,"Record function id": 0, "Ev Idx": 5324 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651909170.412, "dur": 524.933, "args": { "External id": 22734,"Record function id": 0, "Ev Idx": 5325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651909251.794, "dur": 6.755, "args": { "External id": 22735,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651909281.982, "dur": 27.658, "args": { "External id": 22736,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909289.989, "dur": 1.706, "args": { "External id": 22737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909294.207, "dur": 0.352, "args": { "External id": 22738,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909295.843, "dur": 0.514, "args": { "External id": 22739,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909298.019, "dur": 0.403, "args": { "External id": 22740,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909299.485, "dur": 0.167, "args": { "External id": 22741,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909301.635, "dur": 0.291, "args": { "External id": 22742,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909302.657, "dur": 0.298, "args": { "External id": 22743,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909304.268, "dur": 0.166, "args": { "External id": 22744,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909305.382, "dur": 0.395, "args": { "External id": 22745,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651909320.441, "dur": 34.920, "args": { "External id": 22746,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5337 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651909386.756, "dur": 89.075, "args": { "External id": 22747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651909396.978, "dur": 3.378, "args": { "External id": 22748,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651909405.381, "dur": 9.769, "args": { "External id": 22749,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651909409.688, "dur": 5.058, "args": { "External id": 22750,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909412.914, "dur": 0.544, "args": { "External id": 22751,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651909421.428, "dur": 20.428, "args": { "External id": 22752,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909422.921, "dur": 0.402, "args": { "External id": 22753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909425.214, "dur": 0.807, "args": { "External id": 22754,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909426.910, "dur": 0.217, "args": { "External id": 22755,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909427.880, "dur": 0.395, "args": { "External id": 22756,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909429.305, "dur": 0.587, "args": { "External id": 22757,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909431.354, "dur": 0.382, "args": { "External id": 22758,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909434.901, "dur": 0.329, "args": { "External id": 22759,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909436.110, "dur": 0.556, "args": { "External id": 22760,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651909437.609, "dur": 0.673, "args": { "External id": 22761,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651909451.102, "dur": 17.447, "args": { "External id": 22762,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5353 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651909519.124, "dur": 112.658, "args": { "External id": 22763,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5354 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651909546.660, "dur": 81.525, "args": { "External id": 22764,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5355, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651909556.220, "dur": 68.086, "args": { "External id": 22765,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5356 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651909647.796, "dur": 1.773, "args": { "External id": 22766,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5357, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651909722.923, "dur": 1676.372, "args": { "External id": 22767,"Sequence number": 246546, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5358 } }, { "ph": "f", "id": 222, "pid": 1336754, "tid": 1381179, "ts": 1295651909722.923, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651909831.679, "dur": 102.262, "args": { "External id": 22768,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5359 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651909972.588, "dur": 80.155, "args": { "External id": 22769,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651910076.317, "dur": 59.120, "args": { "External id": 22770,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910144.920, "dur": 33.160, "args": { "External id": 22771,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910184.987, "dur": 60.287, "args": { "External id": 22772,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910255.592, "dur": 32.826, "args": { "External id": 22773,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910296.748, "dur": 42.314, "args": { "External id": 22774,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5365 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651910366.164, "dur": 27.080, "args": { "External id": 22775,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5366 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651910413.884, "dur": 27.857, "args": { "External id": 22776,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5367 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651910461.279, "dur": 25.078, "args": { "External id": 22777,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5368 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651910501.053, "dur": 14.339, "args": { "External id": 22778,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910523.412, "dur": 29.240, "args": { "External id": 22779,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910556.083, "dur": 32.610, "args": { "External id": 22780,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5371 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651910614.703, "dur": 164.701, "args": { "External id": 22781,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651910691.373, "dur": 6.284, "args": { "External id": 22782,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651910699.555, "dur": 1.912, "args": { "External id": 22783,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5374 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651910814.090, "dur": 24.297, "args": { "External id": 22784,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5375 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651910850.310, "dur": 13.482, "args": { "External id": 22785,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910871.070, "dur": 32.662, "args": { "External id": 22786,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910912.476, "dur": 33.432, "args": { "External id": 22787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910952.474, "dur": 23.619, "args": { "External id": 22788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651910979.920, "dur": 72.302, "args": { "External id": 22789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651911061.887, "dur": 23.829, "args": { "External id": 22790,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651911092.708, "dur": 40.832, "args": { "External id": 22791,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5382 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651911164.713, "dur": 26.514, "args": { "External id": 22792,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5383 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651911212.627, "dur": 38.256, "args": { "External id": 22793,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5384 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651911272.797, "dur": 17.422, "args": { "External id": 22794,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5385 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651911319.487, "dur": 15.556, "args": { "External id": 22795,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5386 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651911351.032, "dur": 15.961, "args": { "External id": 22796,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5387 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911444.515, "dur": 15.950, "args": { "External id": 22797,"Record function id": 0, "Ev Idx": 5388 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911447.781, "dur": 11.601, "args": { "External id": 22798,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911452.306, "dur": 5.998, "args": { "External id": 22799,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5390 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911454.043, "dur": 4.158, "args": { "External id": 22800,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5391 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911464.392, "dur": 5.617, "args": { "External id": 22801,"Record function id": 0, "Ev Idx": 5392 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911465.977, "dur": 3.563, "args": { "External id": 22802,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911467.046, "dur": 1.968, "args": { "External id": 22803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911467.767, "dur": 1.148, "args": { "External id": 22804,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5395 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911473.277, "dur": 3.836, "args": { "External id": 22805,"Record function id": 0, "Ev Idx": 5396 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911474.337, "dur": 2.376, "args": { "External id": 22806,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911475.024, "dur": 1.268, "args": { "External id": 22807,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5398 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911475.538, "dur": 0.684, "args": { "External id": 22808,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5399 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911480.325, "dur": 5.134, "args": { "External id": 22809,"Record function id": 0, "Ev Idx": 5400 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911481.530, "dur": 3.533, "args": { "External id": 22810,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911482.364, "dur": 2.307, "args": { "External id": 22811,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5402 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911482.983, "dur": 1.613, "args": { "External id": 22812,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5403 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911491.757, "dur": 3.914, "args": { "External id": 22813,"Record function id": 0, "Ev Idx": 5404 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911492.945, "dur": 2.272, "args": { "External id": 22814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911493.490, "dur": 1.321, "args": { "External id": 22815,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5406 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911494.087, "dur": 0.642, "args": { "External id": 22816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5407 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911498.721, "dur": 4.309, "args": { "External id": 22817,"Record function id": 0, "Ev Idx": 5408 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911499.983, "dur": 2.618, "args": { "External id": 22818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911500.878, "dur": 1.304, "args": { "External id": 22819,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5410 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911501.285, "dur": 0.785, "args": { "External id": 22820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5411 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911506.398, "dur": 3.616, "args": { "External id": 22821,"Record function id": 0, "Ev Idx": 5412 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911507.512, "dur": 2.089, "args": { "External id": 22822,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911508.036, "dur": 1.151, "args": { "External id": 22823,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5414 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911508.538, "dur": 0.583, "args": { "External id": 22824,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5415 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911513.142, "dur": 3.782, "args": { "External id": 22825,"Record function id": 0, "Ev Idx": 5416 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911514.250, "dur": 2.266, "args": { "External id": 22826,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911514.882, "dur": 1.176, "args": { "External id": 22827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5418 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911515.368, "dur": 0.584, "args": { "External id": 22828,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5419 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911520.052, "dur": 3.349, "args": { "External id": 22829,"Record function id": 0, "Ev Idx": 5420 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651911521.211, "dur": 1.785, "args": { "External id": 22830,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911521.769, "dur": 0.847, "args": { "External id": 22831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5422 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651911522.081, "dur": 0.469, "args": { "External id": 22832,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5423 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651911527.144, "dur": 36422.433, "args": { "External id": 22833,"Record function id": 0, "Sequence number": 246545, "Fwd thread id": 1, "Ev Idx": 5424 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651911528.402, "dur": 36412.477, "args": { "External id": 22834,"Sequence number": 246545, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5425 } }, { "ph": "f", "id": 223, "pid": 1336754, "tid": 1381179, "ts": 1295651911528.402, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651911561.197, "dur": 37.592, "args": { "External id": 22835,"Record function id": 0, "Ev Idx": 5426 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651911606.289, "dur": 68.422, "args": { "External id": 22836,"Record function id": 0, "Ev Idx": 5427 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.2)", "pid": 1336754, "tid": 1381179, "ts": 1295651911680.259, "dur": 36253.004, "args": { "External id": 22837,"Record function id": 0, "Ev Idx": 5428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651911772.081, "dur": 6.460, "args": { "External id": 22838,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651911787.902, "dur": 4.687, "args": { "External id": 22839,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5430 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651911806.699, "dur": 35292.457, "args": { "External id": 22840,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651911820.732, "dur": 35267.841, "args": { "External id": 22841,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651911872.047, "dur": 17.767, "args": { "External id": 22842,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651911895.982, "dur": 35151.972, "args": { "External id": 22843,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651911898.214, "dur": 35149.002, "args": { "External id": 22844,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651911902.153, "dur": 5.071, "args": { "External id": 22845,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651911911.446, "dur": 35131.235, "args": { "External id": 22846,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651947198.291, "dur": 10.927, "args": { "External id": 22847,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651947201.542, "dur": 7.356, "args": { "External id": 22848,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5439 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651947251.800, "dur": 404.333, "args": { "External id": 22849,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651947285.477, "dur": 365.842, "args": { "External id": 22850,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5441, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651947297.940, "dur": 347.533, "args": { "External id": 22851,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5442 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651947675.329, "dur": 2.388, "args": { "External id": 22852,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5443, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947736.325, "dur": 6.851, "args": { "External id": 22853,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947789.145, "dur": 1.384, "args": { "External id": 22854,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947806.898, "dur": 1.278, "args": { "External id": 22855,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947819.446, "dur": 1.024, "args": { "External id": 22856,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947830.653, "dur": 1.130, "args": { "External id": 22857,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947841.656, "dur": 1.258, "args": { "External id": 22858,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947852.749, "dur": 0.925, "args": { "External id": 22859,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947863.206, "dur": 1.582, "args": { "External id": 22860,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651947873.999, "dur": 0.762, "args": { "External id": 22861,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5452 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651947962.927, "dur": 2719.645, "args": { "External id": 22862,"Record function id": 0, "Ev Idx": 5453 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651948019.459, "dur": 1030.108, "args": { "External id": 22863,"Record function id": 0, "Ev Idx": 5454 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651948036.894, "dur": 340.783, "args": { "External id": 22864,"Record function id": 0, "Ev Idx": 5455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948125.740, "dur": 4.915, "args": { "External id": 22865,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948134.053, "dur": 1.840, "args": { "External id": 22866,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948137.664, "dur": 0.954, "args": { "External id": 22867,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948140.576, "dur": 1.056, "args": { "External id": 22868,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948145.205, "dur": 1.403, "args": { "External id": 22869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948148.466, "dur": 0.866, "args": { "External id": 22870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948150.702, "dur": 0.574, "args": { "External id": 22871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948152.542, "dur": 1.389, "args": { "External id": 22872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948157.568, "dur": 0.917, "args": { "External id": 22873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651948159.751, "dur": 0.784, "args": { "External id": 22874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5465 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651948178.012, "dur": 168.803, "args": { "External id": 22875,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651948193.887, "dur": 148.027, "args": { "External id": 22876,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651948210.744, "dur": 12.573, "args": { "External id": 22877,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651948226.387, "dur": 86.450, "args": { "External id": 22878,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651948244.727, "dur": 67.777, "args": { "External id": 22879,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948248.974, "dur": 6.691, "args": { "External id": 22880,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651948257.732, "dur": 54.224, "args": { "External id": 22881,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5472 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::backward_prefetch for model.layers.0", "pid": 1336754, "tid": 1381179, "ts": 1295651948479.466, "dur": 562.100, "args": { "External id": 22882,"Record function id": 0, "Ev Idx": 5473 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651948496.585, "dur": 527.939, "args": { "External id": 22883,"Record function id": 0, "Ev Idx": 5474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651948565.554, "dur": 4.735, "args": { "External id": 22884,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651948586.227, "dur": 25.712, "args": { "External id": 22885,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948591.430, "dur": 1.973, "args": { "External id": 22886,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948595.309, "dur": 0.318, "args": { "External id": 22887,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948597.783, "dur": 0.546, "args": { "External id": 22888,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948600.013, "dur": 0.206, "args": { "External id": 22889,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948601.666, "dur": 0.606, "args": { "External id": 22890,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948603.285, "dur": 0.444, "args": { "External id": 22891,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948605.210, "dur": 0.369, "args": { "External id": 22892,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948606.663, "dur": 0.380, "args": { "External id": 22893,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948608.266, "dur": 0.308, "args": { "External id": 22894,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651948622.006, "dur": 29.911, "args": { "External id": 22895,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5486 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1381179, "ts": 1295651948682.121, "dur": 86.144, "args": { "External id": 22896,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 5487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651948691.581, "dur": 3.099, "args": { "External id": 22897,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1381179, "ts": 1295651948699.508, "dur": 10.042, "args": { "External id": 22898,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1381179, "ts": 1295651948703.680, "dur": 5.451, "args": { "External id": 22899,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 5490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948707.141, "dur": 0.686, "args": { "External id": 22900,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 5491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1381179, "ts": 1295651948716.088, "dur": 19.091, "args": { "External id": 22901,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948717.600, "dur": 0.414, "args": { "External id": 22902,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948719.020, "dur": 0.182, "args": { "External id": 22903,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948720.986, "dur": 0.473, "args": { "External id": 22904,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948722.503, "dur": 0.487, "args": { "External id": 22905,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948723.902, "dur": 0.395, "args": { "External id": 22906,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948724.981, "dur": 0.534, "args": { "External id": 22907,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948727.179, "dur": 0.811, "args": { "External id": 22908,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948728.752, "dur": 0.187, "args": { "External id": 22909,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651948729.991, "dur": 0.197, "args": { "External id": 22910,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651948743.896, "dur": 17.354, "args": { "External id": 22911,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5502 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651948809.951, "dur": 106.457, "args": { "External id": 22912,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 5503 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651948833.207, "dur": 80.060, "args": { "External id": 22913,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5504, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1381179, "ts": 1295651948843.946, "dur": 65.694, "args": { "External id": 22914,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 5505 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651948934.818, "dur": 1.809, "args": { "External id": 22915,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5506, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651949057.641, "dur": 1603.698, "args": { "External id": 22916,"Sequence number": 246544, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5507 } }, { "ph": "f", "id": 224, "pid": 1336754, "tid": 1381179, "ts": 1295651949057.641, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949174.363, "dur": 125.137, "args": { "External id": 22917,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5508 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651949345.310, "dur": 39.959, "args": { "External id": 22918,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651949405.285, "dur": 51.061, "args": { "External id": 22919,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949466.612, "dur": 32.016, "args": { "External id": 22920,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949505.149, "dur": 44.804, "args": { "External id": 22921,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949556.957, "dur": 27.927, "args": { "External id": 22922,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949593.629, "dur": 42.533, "args": { "External id": 22923,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5514 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651949660.031, "dur": 24.982, "args": { "External id": 22924,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5515 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651949704.956, "dur": 26.491, "args": { "External id": 22925,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5516 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651949751.925, "dur": 19.241, "args": { "External id": 22926,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5517 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651949784.025, "dur": 14.094, "args": { "External id": 22927,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949806.612, "dur": 28.131, "args": { "External id": 22928,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651949838.003, "dur": 32.412, "args": { "External id": 22929,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5520 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651949896.138, "dur": 205.116, "args": { "External id": 22930,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651949969.762, "dur": 6.112, "args": { "External id": 22931,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651949977.893, "dur": 2.234, "args": { "External id": 22932,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5523 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651950140.973, "dur": 24.794, "args": { "External id": 22933,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5524 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651950177.277, "dur": 12.369, "args": { "External id": 22934,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950197.866, "dur": 59.965, "args": { "External id": 22935,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950266.452, "dur": 38.198, "args": { "External id": 22936,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950312.093, "dur": 20.792, "args": { "External id": 22937,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950337.295, "dur": 30.581, "args": { "External id": 22938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950373.626, "dur": 19.733, "args": { "External id": 22939,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651950400.350, "dur": 28.955, "args": { "External id": 22940,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5531 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651950449.165, "dur": 21.841, "args": { "External id": 22941,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5532 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651950502.409, "dur": 30.517, "args": { "External id": 22942,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651950553.095, "dur": 17.010, "args": { "External id": 22943,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5534 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651950588.212, "dur": 13.688, "args": { "External id": 22944,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651950617.156, "dur": 14.766, "args": { "External id": 22945,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5536 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950707.985, "dur": 15.324, "args": { "External id": 22946,"Record function id": 0, "Ev Idx": 5537 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950711.374, "dur": 11.014, "args": { "External id": 22947,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950715.404, "dur": 6.000, "args": { "External id": 22948,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5539 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950717.219, "dur": 4.097, "args": { "External id": 22949,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5540 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950727.240, "dur": 5.299, "args": { "External id": 22950,"Record function id": 0, "Ev Idx": 5541 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950728.738, "dur": 3.396, "args": { "External id": 22951,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950729.726, "dur": 1.937, "args": { "External id": 22952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5543 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950730.469, "dur": 1.118, "args": { "External id": 22953,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5544 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950736.017, "dur": 5.217, "args": { "External id": 22954,"Record function id": 0, "Ev Idx": 5545 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950737.414, "dur": 3.383, "args": { "External id": 22955,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950738.416, "dur": 1.909, "args": { "External id": 22956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5547 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950739.150, "dur": 1.067, "args": { "External id": 22957,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5548 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950744.568, "dur": 3.867, "args": { "External id": 22958,"Record function id": 0, "Ev Idx": 5549 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950745.987, "dur": 2.062, "args": { "External id": 22959,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950746.641, "dur": 0.968, "args": { "External id": 22960,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5551 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950747.089, "dur": 0.446, "args": { "External id": 22961,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5552 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950751.616, "dur": 6.509, "args": { "External id": 22962,"Record function id": 0, "Ev Idx": 5553 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950752.705, "dur": 5.005, "args": { "External id": 22963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950753.203, "dur": 3.993, "args": { "External id": 22964,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5555 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950753.480, "dur": 3.651, "args": { "External id": 22965,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5556 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950761.304, "dur": 3.736, "args": { "External id": 22966,"Record function id": 0, "Ev Idx": 5557 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950762.461, "dur": 2.180, "args": { "External id": 22967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950762.940, "dur": 1.280, "args": { "External id": 22968,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5559 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950763.533, "dur": 0.625, "args": { "External id": 22969,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5560 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950768.265, "dur": 3.579, "args": { "External id": 22970,"Record function id": 0, "Ev Idx": 5561 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950769.510, "dur": 1.914, "args": { "External id": 22971,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950769.992, "dur": 0.935, "args": { "External id": 22972,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5563 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950770.364, "dur": 0.502, "args": { "External id": 22973,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5564 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950774.928, "dur": 5.488, "args": { "External id": 22974,"Record function id": 0, "Ev Idx": 5565 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950775.879, "dur": 4.110, "args": { "External id": 22975,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950776.476, "dur": 3.056, "args": { "External id": 22976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5567 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950778.898, "dur": 0.531, "args": { "External id": 22977,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5568 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950783.449, "dur": 3.907, "args": { "External id": 22978,"Record function id": 0, "Ev Idx": 5569 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651950784.607, "dur": 2.351, "args": { "External id": 22979,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950785.056, "dur": 1.474, "args": { "External id": 22980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5571 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651950785.316, "dur": 1.133, "args": { "External id": 22981,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5572 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651950791.175, "dur": 35854.550, "args": { "External id": 22982,"Record function id": 0, "Sequence number": 246543, "Fwd thread id": 1, "Ev Idx": 5573 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651950792.687, "dur": 35844.598, "args": { "External id": 22983,"Sequence number": 246543, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5574 } }, { "ph": "f", "id": 225, "pid": 1336754, "tid": 1381179, "ts": 1295651950792.687, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651950825.193, "dur": 35.279, "args": { "External id": 22984,"Record function id": 0, "Ev Idx": 5575 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651950867.626, "dur": 73.194, "args": { "External id": 22985,"Record function id": 0, "Ev Idx": 5576 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.1)", "pid": 1336754, "tid": 1381179, "ts": 1295651950946.323, "dur": 35682.321, "args": { "External id": 22986,"Record function id": 0, "Ev Idx": 5577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651951095.588, "dur": 7.388, "args": { "External id": 22987,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651951116.331, "dur": 5.153, "args": { "External id": 22988,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651951138.149, "dur": 34702.113, "args": { "External id": 22989,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651951151.668, "dur": 34679.458, "args": { "External id": 22990,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651951203.106, "dur": 21.052, "args": { "External id": 22991,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651951245.333, "dur": 34547.751, "args": { "External id": 22992,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651951248.097, "dur": 34544.394, "args": { "External id": 22993,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651951252.311, "dur": 6.703, "args": { "External id": 22994,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651951261.228, "dur": 34527.845, "args": { "External id": 22995,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295651985931.663, "dur": 9.326, "args": { "External id": 22996,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651985934.487, "dur": 6.169, "args": { "External id": 22997,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5588 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295651985970.107, "dur": 371.162, "args": { "External id": 22998,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5589 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651986025.550, "dur": 310.615, "args": { "External id": 22999,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5590, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295651986038.213, "dur": 292.117, "args": { "External id": 23000,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5591 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295651986364.184, "dur": 2.414, "args": { "External id": 23001,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5592, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986427.000, "dur": 6.824, "args": { "External id": 23002,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986478.686, "dur": 1.426, "args": { "External id": 23003,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986495.405, "dur": 1.305, "args": { "External id": 23004,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986508.712, "dur": 1.347, "args": { "External id": 23005,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986520.552, "dur": 0.904, "args": { "External id": 23006,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986531.784, "dur": 0.780, "args": { "External id": 23007,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986545.002, "dur": 1.147, "args": { "External id": 23008,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986557.099, "dur": 1.562, "args": { "External id": 23009,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986568.032, "dur": 0.558, "args": { "External id": 23010,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5601 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651986659.338, "dur": 2145.434, "args": { "External id": 23011,"Record function id": 0, "Ev Idx": 5602 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_backward (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651986678.255, "dur": 488.079, "args": { "External id": 23012,"Record function id": 0, "Ev Idx": 5603 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651986694.350, "dur": 357.793, "args": { "External id": 23013,"Record function id": 0, "Ev Idx": 5604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986779.855, "dur": 3.982, "args": { "External id": 23014,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986786.915, "dur": 1.008, "args": { "External id": 23015,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986791.813, "dur": 1.149, "args": { "External id": 23016,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986794.710, "dur": 0.980, "args": { "External id": 23017,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986797.419, "dur": 1.050, "args": { "External id": 23018,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986799.587, "dur": 1.292, "args": { "External id": 23019,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986804.193, "dur": 1.316, "args": { "External id": 23020,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986806.984, "dur": 0.793, "args": { "External id": 23021,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986808.980, "dur": 1.084, "args": { "External id": 23022,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651986811.814, "dur": 0.880, "args": { "External id": 23023,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5614 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651986831.612, "dur": 147.995, "args": { "External id": 23024,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651986849.214, "dur": 126.118, "args": { "External id": 23025,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 5616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651986865.613, "dur": 12.478, "args": { "External id": 23026,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651986881.371, "dur": 66.655, "args": { "External id": 23027,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 5618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651986883.988, "dur": 63.750, "args": { "External id": 23028,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 5619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651986887.459, "dur": 5.330, "args": { "External id": 23029,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651986894.459, "dur": 52.646, "args": { "External id": 23030,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 5621 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651987174.322, "dur": 1605.911, "args": { "External id": 23031,"Sequence number": 246542, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5622 } }, { "ph": "f", "id": 226, "pid": 1336754, "tid": 1381179, "ts": 1295651987174.322, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987303.474, "dur": 107.647, "args": { "External id": 23032,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [5632, 1], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 5623 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_add_mul_rsub_silu_0", "pid": 1336754, "tid": 1381179, "ts": 1295651987452.443, "dur": 43.415, "args": { "External id": 23033,"kernel_hash": "cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/fu/cfuhkv7kka2c7zpla7ojjnsceqymafevjnpfblu4fjcq7zkig5bj.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [65536, 5632], [16, 4096, 5632], [16, 4096, 5632], [16, 4096, 5632], []], "Ev Idx": 5624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::bmm", "pid": 1336754, "tid": 1381179, "ts": 1295651987512.100, "dur": 47.971, "args": { "External id": 23034,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[0, 1, 2048], [0, 5632, 1], [11534336, 5632, 1]], "Input Dims": [[1, 2048, 65536], [1, 65536, 5632], [1, 2048, 5632]], "Ev Idx": 5625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987569.101, "dur": 32.050, "args": { "External id": 23035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987607.178, "dur": 45.859, "args": { "External id": 23036,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987660.363, "dur": 28.462, "args": { "External id": 23037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 5632], [2048, 1], [2048, 1]], "Input Dims": [[5632, 65536], [65536, 2048], [5632, 2048]], "Ev Idx": 5628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987695.979, "dur": 42.669, "args": { "External id": 23038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 5629 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_1", "pid": 1336754, "tid": 1381179, "ts": 1295651987763.053, "dur": 22.254, "args": { "External id": 23039,"kernel_hash": "cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/wm/cwmdtyuwgj7j3fxg57ckso72wqi2qzdp23gsirbcv7772zguon5s.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 5630 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_0", "pid": 1336754, "tid": 1381179, "ts": 1295651987806.812, "dur": 28.552, "args": { "External id": 23040,"kernel_hash": "cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "True", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/br/cbr4fu2k5yr5uawq4iznngbgj5pxe5dndn6dpk7pftmhdoiq6bbz.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5631 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651987875.325, "dur": 20.987, "args": { "External id": 23041,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5632 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651987910.641, "dur": 14.769, "args": { "External id": 23042,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987932.870, "dur": 28.864, "args": { "External id": 23043,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651987964.945, "dur": 70.165, "args": { "External id": 23044,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5635 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_backward", "pid": 1336754, "tid": 1381179, "ts": 1295651988065.245, "dur": 187.476, "args": { "External id": 23045,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar", "long int"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [131072, 4096, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [1]], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 32, 4096], [16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [2]], "Ev Idx": 5636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651988145.065, "dur": 6.821, "args": { "External id": 23046,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651988156.623, "dur": 1.619, "args": { "External id": 23047,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5638 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651988292.859, "dur": 28.348, "args": { "External id": 23048,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5639 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1381179, "ts": 1295651988335.141, "dur": 13.831, "args": { "External id": 23049,"kernel_hash": "cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "True"], "kernel_file": "/tmp/torchinductor_cvm/x2/cx2glzcaftzl4kfweo3o3hwtcmldzbfyqvcfcw2pz2jtvbtjqryt.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988357.924, "dur": 42.395, "args": { "External id": 23050,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988406.836, "dur": 36.846, "args": { "External id": 23051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988450.414, "dur": 20.706, "args": { "External id": 23052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988475.466, "dur": 29.684, "args": { "External id": 23053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988510.754, "dur": 22.875, "args": { "External id": 23054,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 2048], [2048, 1], [2048, 1]], "Input Dims": [[2048, 65536], [65536, 2048], [2048, 2048]], "Ev Idx": 5645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1381179, "ts": 1295651988541.613, "dur": 30.640, "args": { "External id": 23055,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 5646 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_4", "pid": 1336754, "tid": 1381179, "ts": 1295651988594.808, "dur": 22.108, "args": { "External id": 23056,"kernel_hash": "c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/6w/c6w57dwqlavni5blikci5m4csat5hnlhey5taj7vfkseu26zork7.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [65536, 2048], []], "Ev Idx": 5647 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_bwd_kernel_2", "pid": 1336754, "tid": 1381179, "ts": 1295651988634.325, "dur": 26.998, "args": { "External id": 23057,"kernel_hash": "c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "65536", "2048", "1", "497", "132", "True", "2048", "False", "False", "True", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/4k/c4kzku375wvjr3l7odspnz7rfogvuxnctfgzi5ygczeoztmm5agk.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [2048], [65536, 2048], [65536, 2048], [132, 2048], [65536], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 5648 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_red_fused_sum_2", "pid": 1336754, "tid": 1381179, "ts": 1295651988678.212, "dur": 19.363, "args": { "External id": 23058,"kernel_hash": "ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl", "grid": "grid(4096,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "4096", "66"], "kernel_file": "/tmp/torchinductor_cvm/eo/ceozqyu7bzyhxbdlyjtvnat56d7ry6756gzuyvjf77ovbjuz4uhl.py", "kernel_backend": "triton", "Input type": ["float", "float", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [4096, 1, 2048], [], []], "Input Dims": [[132, 2048], [1, 2048, 2], [], []], "Ev Idx": 5649 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_per_fused__to_copy_sum_3", "pid": 1336754, "tid": 1381179, "ts": 1295651988711.960, "dur": 13.649, "args": { "External id": 23059,"kernel_hash": "ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk", "grid": "grid(2048,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "2048", "2"], "kernel_file": "/tmp/torchinductor_cvm/cn/ccn5gbptcig4tn232fiwehcb54hd6zxt5b2su6bhwqzwbeu53yqk.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 2048], [2048, 1], [], []], "Input Dims": [[1, 2048, 2], [1, 2048], [], []], "Ev Idx": 5650 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_5", "pid": 1336754, "tid": 1381179, "ts": 1295651988739.390, "dur": 14.953, "args": { "External id": 23060,"kernel_hash": "cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/eb/cebp6425kwg6qjs7vc5dpxqx2tgnwzzcolkzg6q26v5rzluozz5b.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], [16, 4096, 2048], []], "Ev Idx": 5651 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988827.391, "dur": 14.996, "args": { "External id": 23061,"Record function id": 0, "Ev Idx": 5652 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988830.796, "dur": 10.630, "args": { "External id": 23062,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988834.701, "dur": 5.784, "args": { "External id": 23063,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5654 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988836.252, "dur": 4.131, "args": { "External id": 23064,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5655 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988846.192, "dur": 4.930, "args": { "External id": 23065,"Record function id": 0, "Ev Idx": 5656 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988847.715, "dur": 2.939, "args": { "External id": 23066,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988848.519, "dur": 1.647, "args": { "External id": 23067,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5658 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988849.188, "dur": 0.917, "args": { "External id": 23068,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5659 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988854.502, "dur": 5.086, "args": { "External id": 23069,"Record function id": 0, "Ev Idx": 5660 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988856.044, "dur": 3.111, "args": { "External id": 23070,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988857.003, "dur": 1.680, "args": { "External id": 23071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5662 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988857.773, "dur": 0.771, "args": { "External id": 23072,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[2048]], "Ev Idx": 5663 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988862.771, "dur": 4.642, "args": { "External id": 23073,"Record function id": 0, "Ev Idx": 5664 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988864.461, "dur": 2.563, "args": { "External id": 23074,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988865.249, "dur": 1.306, "args": { "External id": 23075,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5666 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988865.868, "dur": 0.610, "args": { "External id": 23076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 5667 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988870.557, "dur": 4.495, "args": { "External id": 23077,"Record function id": 0, "Ev Idx": 5668 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988872.002, "dur": 2.641, "args": { "External id": 23078,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988872.731, "dur": 1.363, "args": { "External id": 23079,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5670 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988873.323, "dur": 0.703, "args": { "External id": 23080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5671 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988878.129, "dur": 4.893, "args": { "External id": 23081,"Record function id": 0, "Ev Idx": 5672 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988879.986, "dur": 2.610, "args": { "External id": 23082,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988880.475, "dur": 1.688, "args": { "External id": 23083,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5674 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988881.303, "dur": 0.795, "args": { "External id": 23084,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5675 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988886.355, "dur": 3.770, "args": { "External id": 23085,"Record function id": 0, "Ev Idx": 5676 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988887.642, "dur": 2.035, "args": { "External id": 23086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988888.315, "dur": 0.941, "args": { "External id": 23087,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5678 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988888.605, "dur": 0.584, "args": { "External id": 23088,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5679 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988893.242, "dur": 4.151, "args": { "External id": 23089,"Record function id": 0, "Ev Idx": 5680 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988894.796, "dur": 2.191, "args": { "External id": 23090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988895.416, "dur": 1.139, "args": { "External id": 23091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5682 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988895.912, "dur": 0.576, "args": { "External id": 23092,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 5683 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988900.399, "dur": 6.160, "args": { "External id": 23093,"Record function id": 0, "Ev Idx": 5684 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295651988901.583, "dur": 4.519, "args": { "External id": 23094,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988902.603, "dur": 3.058, "args": { "External id": 23095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5686 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295651988905.102, "dur": 0.461, "args": { "External id": 23096,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 5687 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651988910.123, "dur": 36054.319, "args": { "External id": 23097,"Record function id": 0, "Sequence number": 246541, "Fwd thread id": 1, "Ev Idx": 5688 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295651988911.749, "dur": 36043.699, "args": { "External id": 23098,"Sequence number": 246541, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5689 } }, { "ph": "f", "id": 227, "pid": 1336754, "tid": 1381179, "ts": 1295651988911.749, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651988940.074, "dur": 39.204, "args": { "External id": 23099,"Record function id": 0, "Ev Idx": 5690 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651989028.258, "dur": 74.021, "args": { "External id": 23100,"Record function id": 0, "Ev Idx": 5691 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce (model.layers.0)", "pid": 1336754, "tid": 1381179, "ts": 1295651989109.509, "dur": 35838.796, "args": { "External id": 23101,"Record function id": 0, "Ev Idx": 5692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651989216.201, "dur": 7.901, "args": { "External id": 23102,"Record function id": 0, "Concrete Inputs": ["[51384320]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295651989254.336, "dur": 5.512, "args": { "External id": 23103,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 5694 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651989276.243, "dur": 34893.555, "args": { "External id": 23104,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295651989290.550, "dur": 34868.983, "args": { "External id": 23105,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[[1], [2048, 1], [2048, 1], [2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], [], [], [6423040, 1]], "Input Dims": [[[2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], [], [], [8, 6423040]], "Ev Idx": 5696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295651989340.130, "dur": 18.673, "args": { "External id": 23106,"Record function id": 0, "Concrete Inputs": ["[12602]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295651989364.833, "dur": 34755.499, "args": { "External id": 23107,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], [], []], "Ev Idx": 5698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295651989367.766, "dur": 34751.840, "args": { "External id": 23108,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[12602], [], [], [], [], [], []], "Ev Idx": 5699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295651989371.516, "dur": 6.723, "args": { "External id": 23109,"Record function id": 0, "Concrete Inputs": ["[12602]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295651989379.862, "dur": 34735.681, "args": { "External id": 23110,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[12602], [12602], []], "Ev Idx": 5701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295652024282.122, "dur": 13.764, "args": { "External id": 23111,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[51384320], [], [], [], [], []], "Ev Idx": 5702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295652024285.451, "dur": 9.947, "args": { "External id": 23112,"Record function id": 0, "Concrete Inputs": ["[6423040]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5703 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295652024325.144, "dur": 343.733, "args": { "External id": 23113,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[6423040], [51384320], [], [], [], []], "Ev Idx": 5704 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295652024356.140, "dur": 308.418, "args": { "External id": 23114,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 6423040, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[51384320], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5705, "In msg nelems": 51384320 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295652024367.680, "dur": 291.994, "args": { "External id": 23115,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[51384320]], "Ev Idx": 5706 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295652024686.359, "dur": 2.267, "args": { "External id": 23116,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5707, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024745.255, "dur": 6.642, "args": { "External id": 23117,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024797.816, "dur": 1.504, "args": { "External id": 23118,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024815.281, "dur": 1.411, "args": { "External id": 23119,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "524544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024828.250, "dur": 0.888, "args": { "External id": 23120,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1048832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024841.724, "dur": 1.163, "args": { "External id": 23121,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "1573120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024852.224, "dur": 0.943, "args": { "External id": 23122,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024863.175, "dur": 1.208, "args": { "External id": 23123,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "2097664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024874.504, "dur": 1.224, "args": { "External id": 23124,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "3539456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652024887.447, "dur": 1.368, "args": { "External id": 23125,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "4981248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5716 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295652024978.423, "dur": 334.341, "args": { "External id": 23126,"Record function id": 0, "Sequence number": 246540, "Fwd thread id": 1, "Ev Idx": 5717 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunctionBackward", "pid": 1336754, "tid": 1381179, "ts": 1295652025016.841, "dur": 286.538, "args": { "External id": 23127,"Sequence number": 246540, "Fwd thread id": 1, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 5718 } }, { "ph": "f", "id": 228, "pid": 1336754, "tid": 1381179, "ts": 1295652025016.841, "cat": "fwdbwd", "name": "fwdbwd", "bp": "e" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_0", "pid": 1336754, "tid": 1381179, "ts": 1295652025145.200, "dur": 44.975, "args": { "External id": 23128,"kernel_hash": "c6aziuyp6fagrmcedyk7wtb6g56x7av3etx5bs4re25wo6lnvnsr", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/6a/c6aziuyp6fagrmcedyk7wtb6g56x7av3etx5bs4re25wo6lnvnsr.py", "kernel_backend": "triton", "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 5719 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_1", "pid": 1336754, "tid": 1381179, "ts": 1295652025204.247, "dur": 39.960, "args": { "External id": 23129,"kernel_hash": "cltgraj4uipr7sa5n4ns4uyvanquunkc3ybdvrfy5pw2v2cf6swt", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/lt/cltgraj4uipr7sa5n4ns4uyvanquunkc3ybdvrfy5pw2v2cf6swt.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "float", "Scalar"], "Input Strides": [[4096, 1], [8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096], [16, 4096, 2048], [32000, 2048], []], "Ev Idx": 5720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_dense_backward_2", "pid": 1336754, "tid": 1381179, "ts": 1295652025266.423, "dur": 21.469, "args": { "External id": 23130,"kernel_hash": "chiuzhe4yx4geeiep36ony2tqipsfvpo7rwythdxblopxivdgss3", "grid": "grid(65536000,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "65536000"], "kernel_file": "/tmp/torchinductor_cvm/hi/chiuzhe4yx4geeiep36ony2tqipsfvpo7rwythdxblopxivdgss3.py", "kernel_backend": "triton", "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 5721 } }, { "ph": "X", "cat": "cpu_op", "name": "autograd::engine::evaluate_function: torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295652025325.957, "dur": 14.737, "args": { "External id": 23131,"Record function id": 0, "Ev Idx": 5722 } }, { "ph": "X", "cat": "cpu_op", "name": "torch::autograd::AccumulateGrad", "pid": 1336754, "tid": 1381179, "ts": 1295652025328.801, "dur": 11.104, "args": { "External id": 23132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1381179, "ts": 1295652025332.526, "dur": 6.527, "args": { "External id": 23133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5724 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1381179, "ts": 1295652025334.161, "dur": 4.801, "args": { "External id": 23134,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 5725 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_post_backward_callback", "pid": 1336754, "tid": 1381179, "ts": 1295652025364.166, "dur": 7699.768, "args": { "External id": 23135,"Record function id": 0, "Ev Idx": 5726 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_accumulate", "pid": 1336754, "tid": 1381179, "ts": 1295652025386.434, "dur": 39.778, "args": { "External id": 23136,"Record function id": 0, "Ev Idx": 5727 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reshard", "pid": 1336754, "tid": 1381179, "ts": 1295652025432.160, "dur": 285.775, "args": { "External id": 23137,"Record function id": 0, "Ev Idx": 5728 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_backward_reduce", "pid": 1336754, "tid": 1381179, "ts": 1295652025724.094, "dur": 6966.291, "args": { "External id": 23138,"Record function id": 0, "Ev Idx": 5729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295652025844.987, "dur": 6.576, "args": { "External id": 23139,"Record function id": 0, "Concrete Inputs": ["[336611328]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1381179, "ts": 1295652025860.681, "dur": 5.128, "args": { "External id": 23140,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5731 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295652025888.003, "dur": 5504.024, "args": { "External id": 23141,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_chunk_cat", "pid": 1336754, "tid": 1381179, "ts": 1295652025906.913, "dur": 5471.716, "args": { "External id": 23142,"Record function id": 0, "Concrete Inputs": ["", "0", "8", ""], "Input type": ["TensorList", "Scalar", "Scalar", "float"], "Input Strides": [[], [], [], [42076416, 1]], "Input Dims": [[], [], [], [8, 42076416]], "Ev Idx": 5733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295652026223.668, "dur": 36.003, "args": { "External id": 23143,"Record function id": 0, "Concrete Inputs": ["[82421]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1381179, "ts": 1295652026333.646, "dur": 4989.683, "args": { "External id": 23144,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], [], []], "Ev Idx": 5735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1381179, "ts": 1295652026337.047, "dur": 4985.390, "args": { "External id": 23145,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[82421], [], [], [], [], [], []], "Ev Idx": 5736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652026341.967, "dur": 15.264, "args": { "External id": 23146,"Record function id": 0, "Concrete Inputs": ["[82421]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1381179, "ts": 1295652026359.392, "dur": 4957.557, "args": { "External id": 23147,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[82421], [82421], []], "Ev Idx": 5738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1381179, "ts": 1295652031542.744, "dur": 11.700, "args": { "External id": 23148,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "", "", "", "False"], "Input type": ["float", "ScalarList", "", "", "", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[336611328], [], [], [], [], []], "Ev Idx": 5739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1381179, "ts": 1295652031546.100, "dur": 7.971, "args": { "External id": 23149,"Record function id": 0, "Concrete Inputs": ["[42076416]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5740 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_reduce_scatter_base_", "pid": 1336754, "tid": 1381179, "ts": 1295652031583.583, "dur": 461.042, "args": { "External id": 23150,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "-1"], "Input type": ["float", "float", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], [], []], "Input Dims": [[42076416], [336611328], [], [], [], []], "Ev Idx": 5741 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295652031614.505, "dur": 425.319, "args": { "External id": 23151,"Record function id": 0, "Collective name": "_reduce_scatter_base", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 42076416, "Process Group Name": "0", "Input type": ["float", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[336611328], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5742, "In msg nelems": 336611328 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_reduce_scatter_base", "pid": 1336754, "tid": 1381179, "ts": 1295652031630.633, "dur": 402.859, "args": { "External id": 23152,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[336611328]], "Ev Idx": 5743 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1381179, "ts": 1295652032068.725, "dur": 2.604, "args": { "External id": 23153,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5744, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032135.029, "dur": 6.894, "args": { "External id": 23154,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032189.217, "dur": 1.058, "args": { "External id": 23155,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032206.204, "dur": 1.756, "args": { "External id": 23156,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8192256"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032219.575, "dur": 0.940, "args": { "External id": 23157,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "8716544"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032249.303, "dur": 1.988, "args": { "External id": 23158,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9240832"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032263.210, "dur": 0.705, "args": { "External id": 23159,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "9765120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032275.181, "dur": 1.576, "args": { "External id": 23160,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032287.463, "dur": 0.952, "args": { "External id": 23161,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "10289664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032299.915, "dur": 1.741, "args": { "External id": 23162,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "11731456"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032311.155, "dur": 0.854, "args": { "External id": 23163,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "13173248"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032322.112, "dur": 1.180, "args": { "External id": 23164,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032332.614, "dur": 0.764, "args": { "External id": 23165,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "14615296"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032345.873, "dur": 1.154, "args": { "External id": 23166,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15139584"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032356.626, "dur": 0.704, "args": { "External id": 23167,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "15663872"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032367.097, "dur": 1.115, "args": { "External id": 23168,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "16188160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032377.747, "dur": 1.180, "args": { "External id": 23169,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032388.251, "dur": 1.674, "args": { "External id": 23170,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "16712704"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032401.502, "dur": 0.795, "args": { "External id": 23171,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "18154496"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032412.350, "dur": 1.172, "args": { "External id": 23172,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "19596288"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032422.796, "dur": 1.180, "args": { "External id": 23173,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032434.266, "dur": 1.678, "args": { "External id": 23174,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21038336"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032445.129, "dur": 0.704, "args": { "External id": 23175,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "21562624"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032457.273, "dur": 1.229, "args": { "External id": 23176,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22086912"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032467.846, "dur": 0.880, "args": { "External id": 23177,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "22611200"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032478.571, "dur": 1.380, "args": { "External id": 23178,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032488.433, "dur": 1.004, "args": { "External id": 23179,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "23135744"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032498.739, "dur": 1.410, "args": { "External id": 23180,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "24577536"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032510.667, "dur": 0.908, "args": { "External id": 23181,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "26019328"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032521.709, "dur": 1.204, "args": { "External id": 23182,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032531.777, "dur": 1.174, "args": { "External id": 23183,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27461376"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032543.149, "dur": 1.171, "args": { "External id": 23184,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "27985664"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032553.593, "dur": 0.864, "args": { "External id": 23185,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "28509952"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032563.188, "dur": 1.286, "args": { "External id": 23186,"Record function id": 0, "Concrete Inputs": ["", "[256, 2048]", "[2048, 1]", "29034240"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032572.724, "dur": 0.872, "args": { "External id": 23187,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032585.119, "dur": 1.440, "args": { "External id": 23188,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "29558784"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032595.655, "dur": 1.097, "args": { "External id": 23189,"Record function id": 0, "Concrete Inputs": ["", "[704, 2048]", "[2048, 1]", "31000576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032607.581, "dur": 1.381, "args": { "External id": 23190,"Record function id": 0, "Concrete Inputs": ["", "[256, 5632]", "[5632, 1]", "32442368"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032617.628, "dur": 0.533, "args": { "External id": 23191,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1381179, "ts": 1295652032626.702, "dur": 1.118, "args": { "External id": 23192,"Record function id": 0, "Concrete Inputs": ["", "[4000, 2048]", "[2048, 1]", "33884416"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5783 } }, { "ph": "X", "cat": "user_annotation", "name": "ProfilerStep#1023", "pid": 1336754, "tid": 1336754, "ts": 1295649886584.184, "dur": 2164551.036, "args": { "External id": 12289,"Record function id": 0, "Ev Idx": 5784 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.zero_grad#AdamW.zero_grad", "pid": 1336754, "tid": 1336754, "ts": 1295649886616.093, "dur": 663.698, "args": { "External id": 12290,"Record function id": 0, "Ev Idx": 5785 } }, { "ph": "X", "cat": "user_annotation", "name": "enumerate(DataLoader)#_StatefulMultiProcessingDataLoaderIter.__next__", "pid": 1336754, "tid": 1336754, "ts": 1295649887323.780, "dur": 2160.508, "args": { "External id": 12291,"Record function id": 0, "Ev Idx": 5786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649888491.428, "dur": 8.057, "args": { "External id": 12292,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336754, "tid": 1336754, "ts": 1295649888520.090, "dur": 6.528, "args": { "External id": 12293,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649888947.443, "dur": 2.300, "args": { "External id": 12294,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336754, "tid": 1336754, "ts": 1295649888956.812, "dur": 2.593, "args": { "External id": 12295,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649889373.259, "dur": 2.049, "args": { "External id": 12296,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::set_", "pid": 1336754, "tid": 1336754, "ts": 1295649889382.161, "dur": 2.318, "args": { "External id": 12297,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "0", "[16, 8192]", "[8192, 1]"], "Input type": ["long int", "", "Scalar", "ScalarList", "ScalarList"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[0], [], [], [], []], "Ev Idx": 5792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649890009.998, "dur": 14.398, "args": { "External id": 12298,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649890017.910, "dur": 2.196, "args": { "External id": 12299,"Record function id": 0, "Concrete Inputs": ["", "[16, 8192]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649890026.598, "dur": 4.501, "args": { "External id": 12300,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], []], "Ev Idx": 5795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649890028.761, "dur": 1.199, "args": { "External id": 12301,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 5796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649890058.419, "dur": 499.966, "args": { "External id": 12302,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], [], []], "Ev Idx": 5797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649890065.901, "dur": 491.495, "args": { "External id": 12303,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649890073.435, "dur": 10.084, "args": { "External id": 12304,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649890085.833, "dur": 469.599, "args": { "External id": 12305,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649890095.516, "dur": 0.736, "args": { "External id": 12306,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336754, "tid": 1336754, "ts": 1295649890099.470, "dur": 8.596, "args": { "External id": 12307,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[8192, 1], [4096, 1]], "Input Dims": [[16, 4096], [16, 4096]], "Ev Idx": 5802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336754, "tid": 1336754, "ts": 1295649890104.468, "dur": 3.442, "args": { "External id": 12308,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], []], "Input Dims": [[16, 4096], [], []], "Ev Idx": 5803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649890107.094, "dur": 0.570, "args": { "External id": 12309,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295649890110.702, "dur": 194.565, "args": { "External id": 12310,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295649890113.452, "dur": 191.441, "args": { "External id": 12311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 5806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295649890115.516, "dur": 14.661, "args": { "External id": 12312,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 5807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649890117.813, "dur": 11.873, "args": { "External id": 12313,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649890131.238, "dur": 172.472, "args": { "External id": 12314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649890307.972, "dur": 244.201, "args": { "External id": 12315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649890576.718, "dur": 527.450, "args": { "External id": 12316,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 5811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649890578.616, "dur": 524.501, "args": { "External id": 12317,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], []], "Ev Idx": 5812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649890585.220, "dur": 8.331, "args": { "External id": 12318,"Record function id": 0, "Concrete Inputs": ["[16, 8192]", "[8192, 1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649890594.880, "dur": 503.526, "args": { "External id": 12319,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[8192, 1], [8192, 1], []], "Input Dims": [[16, 8192], [16, 8192], []], "Ev Idx": 5814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336754, "tid": 1336754, "ts": 1295649891136.507, "dur": 56.434, "args": { "External id": 12320,"Record function id": 0, "Concrete Inputs": ["0", "4096", "", "", "", "False"], "Input type": ["Scalar", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649891141.962, "dur": 6.143, "args": { "External id": 12321,"Record function id": 0, "Concrete Inputs": ["[0]", "4", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::arange", "pid": 1336754, "tid": 1336754, "ts": 1295649891151.370, "dur": 41.180, "args": { "External id": 12322,"Record function id": 0, "Concrete Inputs": ["0", "4096", "1", ""], "Input type": ["Scalar", "Scalar", "Scalar", "long int"], "Input Strides": [[], [], [], [1]], "Input Dims": [[], [], [], [0]], "Ev Idx": 5817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295649891156.567, "dur": 7.038, "args": { "External id": 12323,"Record function id": 0, "Concrete Inputs": ["", "[4096]", ""], "Input type": ["long int", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 5818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::repeat", "pid": 1336754, "tid": 1336754, "ts": 1295649891205.920, "dur": 95.003, "args": { "External id": 12324,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4096], []], "Ev Idx": 5819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336754, "tid": 1336754, "ts": 1295649891210.359, "dur": 7.041, "args": { "External id": 12325,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[4096], [], []], "Ev Idx": 5820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891215.293, "dur": 1.790, "args": { "External id": 12326,"Record function id": 0, "Concrete Inputs": ["", "[1, 4096]", "[4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[4096], [], [], []], "Ev Idx": 5821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649891218.443, "dur": 4.595, "args": { "External id": 12327,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1336754, "ts": 1295649891225.074, "dur": 21.740, "args": { "External id": 12328,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[4096, 1]], "Input Dims": [[16, 4096]], "Ev Idx": 5823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336754, "tid": 1336754, "ts": 1295649891252.594, "dur": 6.114, "args": { "External id": 12329,"Record function id": 0, "Concrete Inputs": ["", "0", "1", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891257.731, "dur": 0.801, "args": { "External id": 12330,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 1]", "[4096, 1, 4096]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 5825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336754, "tid": 1336754, "ts": 1295649891259.669, "dur": 3.909, "args": { "External id": 12331,"Record function id": 0, "Concrete Inputs": ["", "1", "4096", "4096"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891262.653, "dur": 0.828, "args": { "External id": 12332,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[4096, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1, 4096], [], [], []], "Input Dims": [[16, 4096, 1], [], [], []], "Ev Idx": 5827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand_as", "pid": 1336754, "tid": 1336754, "ts": 1295649891265.823, "dur": 3.585, "args": { "External id": 12333,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["long int", "long int"], "Input Strides": [[4096, 1], [4096, 4096, 4096, 1]], "Input Dims": [[1, 4096], [16, 1, 1, 4096]], "Ev Idx": 5828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::expand", "pid": 1336754, "tid": 1336754, "ts": 1295649891267.074, "dur": 2.231, "args": { "External id": 12334,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "False"], "Input type": ["long int", "ScalarList", "Scalar"], "Input Strides": [[4096, 1], [], []], "Input Dims": [[1, 4096], [], []], "Ev Idx": 5829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891268.461, "dur": 0.738, "args": { "External id": 12335,"Record function id": 0, "Concrete Inputs": ["", "[16, 1, 1, 4096]", "[0, 4096, 4096, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[4096, 1], [], [], []], "Input Dims": [[1, 4096], [], [], []], "Ev Idx": 5830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649891270.475, "dur": 29.682, "args": { "External id": 12336,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 4096, 4096, 1], [0, 4096, 4096, 1], []], "Input Dims": [[16, 1, 1, 4096], [16, 1, 1, 4096], []], "Ev Idx": 5831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649891310.383, "dur": 30.637, "args": { "External id": 12337,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 5832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649891312.272, "dur": 28.573, "args": { "External id": 12338,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "3", "", "", "", "False", ""], "Input type": ["long int", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[4096, 1], [], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], [], []], "Ev Idx": 5833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891319.234, "dur": 3.322, "args": { "External id": 12339,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "[4096, 1]", "3", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649891323.384, "dur": 16.946, "args": { "External id": 12340,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["int", "long int", "Scalar"], "Input Strides": [[4096, 1], [4096, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 5835 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::root_pre_forward", "pid": 1336754, "tid": 1336754, "ts": 1295649891451.722, "dur": 145.525, "args": { "External id": 12341,"Record function id": 0, "Ev Idx": 5836 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::inputs_to_device", "pid": 1336754, "tid": 1336754, "ts": 1295649891530.704, "dur": 56.169, "args": { "External id": 12342,"Record function id": 0, "Ev Idx": 5837 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295649891604.446, "dur": 42.425, "args": { "External id": 12343,"Record function id": 0, "Ev Idx": 5838 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward", "pid": 1336754, "tid": 1336754, "ts": 1295649891655.197, "dur": 10005.304, "args": { "External id": 12344,"Record function id": 0, "Ev Idx": 5839 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather", "pid": 1336754, "tid": 1336754, "ts": 1295649891663.872, "dur": 1209.374, "args": { "External id": 12345,"Record function id": 0, "Ev Idx": 5840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649891765.697, "dur": 6.481, "args": { "External id": 12346,"Record function id": 0, "Concrete Inputs": ["[42076416]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649891788.974, "dur": 110.408, "args": { "External id": 12347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891793.631, "dur": 1.634, "args": { "External id": 12348,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891800.021, "dur": 0.264, "args": { "External id": 12349,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8192000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891801.281, "dur": 0.288, "args": { "External id": 12350,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8192256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891802.291, "dur": 1.477, "args": { "External id": 12351,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "8716544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891807.869, "dur": 0.435, "args": { "External id": 12352,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9240832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891809.215, "dur": 0.392, "args": { "External id": 12353,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "9765120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891810.281, "dur": 2.558, "args": { "External id": 12354,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "10289408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891814.476, "dur": 0.173, "args": { "External id": 12355,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "10289664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891815.406, "dur": 0.295, "args": { "External id": 12356,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11731456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891820.098, "dur": 0.208, "args": { "External id": 12357,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "13173248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891821.281, "dur": 0.288, "args": { "External id": 12358,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "14615040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891822.493, "dur": 1.266, "args": { "External id": 12359,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "14615296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891826.677, "dur": 0.302, "args": { "External id": 12360,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15139584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891827.848, "dur": 0.317, "args": { "External id": 12361,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "15663872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891829.206, "dur": 2.427, "args": { "External id": 12362,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "16188160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891832.741, "dur": 0.152, "args": { "External id": 12363,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "16712448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891833.751, "dur": 0.171, "args": { "External id": 12364,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "16712704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891836.934, "dur": 0.330, "args": { "External id": 12365,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "18154496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891838.056, "dur": 0.302, "args": { "External id": 12366,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "19596288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891839.387, "dur": 1.520, "args": { "External id": 12367,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "21038080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891844.019, "dur": 0.325, "args": { "External id": 12368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21038336"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891845.379, "dur": 0.283, "args": { "External id": 12369,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "21562624"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891846.565, "dur": 2.792, "args": { "External id": 12370,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22086912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891850.466, "dur": 0.172, "args": { "External id": 12371,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "22611200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891851.488, "dur": 0.261, "args": { "External id": 12372,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "23135488"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891854.958, "dur": 0.402, "args": { "External id": 12373,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "23135744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891856.175, "dur": 0.285, "args": { "External id": 12374,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "24577536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891857.735, "dur": 1.070, "args": { "External id": 12375,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "26019328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891861.957, "dur": 0.456, "args": { "External id": 12376,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "27461120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891863.403, "dur": 0.335, "args": { "External id": 12377,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27461376"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891864.819, "dur": 2.383, "args": { "External id": 12378,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "27985664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891868.220, "dur": 0.151, "args": { "External id": 12379,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "28509952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891869.318, "dur": 0.346, "args": { "External id": 12380,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "29034240"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891872.932, "dur": 0.312, "args": { "External id": 12381,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "29558528"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891874.097, "dur": 0.294, "args": { "External id": 12382,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "29558784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891875.447, "dur": 1.077, "args": { "External id": 12383,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "31000576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891879.658, "dur": 0.307, "args": { "External id": 12384,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "32442368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891881.017, "dur": 0.345, "args": { "External id": 12385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "33884160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649891882.193, "dur": 2.615, "args": { "External id": 12386,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "33884416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649891919.189, "dur": 112.935, "args": { "External id": 12387,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5882 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295649892102.489, "dur": 257.620, "args": { "External id": 12388,"Record function id": 0, "Concrete Inputs": ["", "", "42076416", "8", "1", "15", ""], "Input type": ["TensorList", "", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], []], "Ev Idx": 5883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649892118.549, "dur": 5.531, "args": { "External id": 12389,"Record function id": 0, "Concrete Inputs": ["[336611328]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295649892130.080, "dur": 12.355, "args": { "External id": 12390,"Record function id": 0, "Concrete Inputs": ["", "0", "42076416", "42076416"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649892135.028, "dur": 7.007, "args": { "External id": 12391,"Record function id": 0, "Concrete Inputs": ["", "0", "42076416", "84152832", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[336611328], [], [], [], []], "Ev Idx": 5886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892138.493, "dur": 0.804, "args": { "External id": 12392,"Record function id": 0, "Concrete Inputs": ["", "[42076416]", "[1]", "42076416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[336611328], [], [], []], "Ev Idx": 5887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649892150.755, "dur": 114.981, "args": { "External id": 12393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["c10::BFloat16", "", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[42076416], [], []], "Ev Idx": 5888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892152.989, "dur": 0.641, "args": { "External id": 12394,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "42076416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892155.168, "dur": 0.178, "args": { "External id": 12395,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "50268416"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892156.315, "dur": 1.319, "args": { "External id": 12396,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "50268672"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892158.596, "dur": 0.702, "args": { "External id": 12397,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "50792960"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892160.314, "dur": 0.339, "args": { "External id": 12398,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "51317248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892161.741, "dur": 0.286, "args": { "External id": 12399,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "51841536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892163.641, "dur": 0.311, "args": { "External id": 12400,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "52365824"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892165.634, "dur": 0.177, "args": { "External id": 12401,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "52366080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892166.857, "dur": 0.599, "args": { "External id": 12402,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "53807872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892168.433, "dur": 0.180, "args": { "External id": 12403,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "55249664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892169.525, "dur": 1.121, "args": { "External id": 12404,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "56691456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892171.914, "dur": 0.314, "args": { "External id": 12405,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "56691712"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892173.101, "dur": 2.597, "args": { "External id": 12406,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "57216000"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892176.591, "dur": 0.338, "args": { "External id": 12407,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "57740288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892178.042, "dur": 0.225, "args": { "External id": 12408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "58264576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892181.522, "dur": 0.336, "args": { "External id": 12409,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "58788864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892183.168, "dur": 0.314, "args": { "External id": 12410,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "58789120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892184.890, "dur": 0.321, "args": { "External id": 12411,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "60230912"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892188.355, "dur": 1.189, "args": { "External id": 12412,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "61672704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892190.346, "dur": 0.170, "args": { "External id": 12413,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "63114496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892191.544, "dur": 2.338, "args": { "External id": 12414,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "63114752"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892195.201, "dur": 0.379, "args": { "External id": 12415,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "63639040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892196.688, "dur": 0.158, "args": { "External id": 12416,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "64163328"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892201.236, "dur": 0.154, "args": { "External id": 12417,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "64687616"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892202.240, "dur": 0.299, "args": { "External id": 12418,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "65211904"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892207.452, "dur": 0.155, "args": { "External id": 12419,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "65212160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892210.900, "dur": 1.242, "args": { "External id": 12420,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "66653952"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892213.626, "dur": 0.160, "args": { "External id": 12421,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "68095744"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892214.805, "dur": 2.330, "args": { "External id": 12422,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "69537536"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892218.626, "dur": 0.326, "args": { "External id": 12423,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "69537792"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892219.967, "dur": 0.190, "args": { "External id": 12424,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "70062080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892223.721, "dur": 0.325, "args": { "External id": 12425,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "70586368"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892224.998, "dur": 0.303, "args": { "External id": 12426,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "71110656"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892226.131, "dur": 0.158, "args": { "External id": 12427,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "71634944"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892244.265, "dur": 1.393, "args": { "External id": 12428,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "71635200"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892247.179, "dur": 0.307, "args": { "External id": 12429,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "73076992"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892248.361, "dur": 2.156, "args": { "External id": 12430,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "74518784"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892251.935, "dur": 0.263, "args": { "External id": 12431,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "75960576"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649892253.626, "dur": 0.253, "args": { "External id": 12432,"Record function id": 0, "Concrete Inputs": ["", "[8192000]", "[1]", "75960832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[42076416], [], [], []], "Ev Idx": 5927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649892285.874, "dur": 59.609, "args": { "External id": 12433,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 5928 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295649892417.658, "dur": 355.620, "args": { "External id": 12434,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[336611328], [42076416], [], [], []], "Ev Idx": 5929 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649892456.521, "dur": 312.210, "args": { "External id": 12435,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 336611328, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[42076416], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 5930, "In msg nelems": 42076416 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295649892468.895, "dur": 294.457, "args": { "External id": 12436,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[42076416]], "Ev Idx": 5931 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649892798.748, "dur": 2.332, "args": { "External id": 12437,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 5932, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out", "pid": 1336754, "tid": 1336754, "ts": 1295649892888.302, "dur": 8601.459, "args": { "External id": 12438,"Record function id": 0, "Ev Idx": 5933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893106.773, "dur": 6.889, "args": { "External id": 12439,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[336611328], []], "Ev Idx": 5934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893117.681, "dur": 0.897, "args": { "External id": 12440,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893120.294, "dur": 0.896, "args": { "External id": 12441,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893123.057, "dur": 1.915, "args": { "External id": 12442,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893128.293, "dur": 0.540, "args": { "External id": 12443,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893132.765, "dur": 0.579, "args": { "External id": 12444,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893135.173, "dur": 0.673, "args": { "External id": 12445,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893137.409, "dur": 1.671, "args": { "External id": 12446,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893140.921, "dur": 0.845, "args": { "External id": 12447,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893145.511, "dur": 0.597, "args": { "External id": 12448,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893148.086, "dur": 0.569, "args": { "External id": 12449,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893151.279, "dur": 1.461, "args": { "External id": 12450,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893154.534, "dur": 0.433, "args": { "External id": 12451,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893158.875, "dur": 0.621, "args": { "External id": 12452,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893161.425, "dur": 0.616, "args": { "External id": 12453,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893163.908, "dur": 1.717, "args": { "External id": 12454,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893167.185, "dur": 0.604, "args": { "External id": 12455,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893171.059, "dur": 0.664, "args": { "External id": 12456,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893173.483, "dur": 0.602, "args": { "External id": 12457,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893175.689, "dur": 1.728, "args": { "External id": 12458,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893178.879, "dur": 0.479, "args": { "External id": 12459,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893182.928, "dur": 0.589, "args": { "External id": 12460,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893185.528, "dur": 0.531, "args": { "External id": 12461,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893187.838, "dur": 1.812, "args": { "External id": 12462,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893197.602, "dur": 0.685, "args": { "External id": 12463,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893202.246, "dur": 0.697, "args": { "External id": 12464,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893204.559, "dur": 0.750, "args": { "External id": 12465,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893206.894, "dur": 1.624, "args": { "External id": 12466,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893209.810, "dur": 0.579, "args": { "External id": 12467,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893213.725, "dur": 0.596, "args": { "External id": 12468,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893215.621, "dur": 0.532, "args": { "External id": 12469,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893217.426, "dur": 1.636, "args": { "External id": 12470,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893220.513, "dur": 0.801, "args": { "External id": 12471,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893224.876, "dur": 0.879, "args": { "External id": 12472,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 5967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893243.465, "dur": 1.329, "args": { "External id": 12473,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893247.972, "dur": 1.960, "args": { "External id": 12474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893251.784, "dur": 0.442, "args": { "External id": 12475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893256.030, "dur": 0.437, "args": { "External id": 12476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 5971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893258.229, "dur": 0.458, "args": { "External id": 12477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 5972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649893260.083, "dur": 1.897, "args": { "External id": 12478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[65536000], []], "Ev Idx": 5973 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649893289.995, "dur": 8145.855, "args": { "External id": 12479,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649893316.079, "dur": 8110.195, "args": { "External id": 12480,"Record function id": 0, "Concrete Inputs": ["", "", "1", ""], "Input type": ["c10::BFloat16", "", "Scalar", "TensorList"], "Input Strides": [[42076416, 1], [], [], []], "Input Dims": [[8, 42076416], [], [], []], "Ev Idx": 5975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649893347.403, "dur": 6.052, "args": { "External id": 12481,"Record function id": 0, "Concrete Inputs": ["[4290]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649893361.058, "dur": 8022.720, "args": { "External id": 12482,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], [], []], "Ev Idx": 5977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649893364.042, "dur": 8018.997, "args": { "External id": 12483,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[4290], [], [], [], [], [], []], "Ev Idx": 5978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649893371.900, "dur": 6.359, "args": { "External id": 12484,"Record function id": 0, "Concrete Inputs": ["[4290]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649893380.065, "dur": 7999.682, "args": { "External id": 12485,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[4290], [4290], []], "Ev Idx": 5980 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295649901738.396, "dur": 40.404, "args": { "External id": 12486,"Record function id": 0, "Ev Idx": 5981 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 0/0", "pid": 1336754, "tid": 1336754, "ts": 1295649901780.480, "dur": 258.168, "args": { "External id": 12487,"Record function id": 0, "Ev Idx": 5982 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649901824.291, "dur": 203.602, "args": { "External id": 12488,"Sequence number": 246540, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "long int"], "Input Strides": [[2048, 1], [4096, 1]], "Input Dims": [[32000, 2048], [16, 4096]], "Ev Idx": 5983 } }, { "ph": "s", "id": 228, "pid": 1336754, "tid": 1336754, "ts": 1295649901824.291, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_embedding_0", "pid": 1336754, "tid": 1336754, "ts": 1295649901903.218, "dur": 52.136, "args": { "External id": 12489,"kernel_hash": "c5wemnzn2hvtwjoj3icw7tagar3wjyj7c7i5vhvuszrcw63rsbhp", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/5w/c5wemnzn2hvtwjoj3icw7tagar3wjyj7c7i5vhvuszrcw63rsbhp.py", "kernel_backend": "triton", "Input type": ["long int", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[4096, 1], [2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096], [32000, 2048], [16, 4096, 2048], []], "Ev Idx": 5984 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295649902106.346, "dur": 55.971, "args": { "External id": 12490,"Record function id": 0, "Ev Idx": 5985 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.0)", "pid": 1336754, "tid": 1336754, "ts": 1295649902172.471, "dur": 6934.766, "args": { "External id": 12491,"Record function id": 0, "Ev Idx": 5986 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.0)", "pid": 1336754, "tid": 1336754, "ts": 1295649902181.558, "dur": 762.394, "args": { "External id": 12492,"Record function id": 0, "Ev Idx": 5987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649902269.763, "dur": 12.355, "args": { "External id": 12493,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 5988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649902296.775, "dur": 41.085, "args": { "External id": 12494,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 5989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902304.456, "dur": 2.616, "args": { "External id": 12495,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902309.442, "dur": 0.471, "args": { "External id": 12496,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902311.701, "dur": 3.103, "args": { "External id": 12497,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902316.321, "dur": 0.526, "args": { "External id": 12498,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902318.561, "dur": 0.160, "args": { "External id": 12499,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902322.696, "dur": 0.191, "args": { "External id": 12500,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902324.708, "dur": 0.183, "args": { "External id": 12501,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902326.261, "dur": 1.726, "args": { "External id": 12502,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902331.193, "dur": 0.364, "args": { "External id": 12503,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 5998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649902349.021, "dur": 37.323, "args": { "External id": 12504,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 5999 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295649902420.033, "dur": 106.716, "args": { "External id": 12505,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649902431.797, "dur": 3.799, "args": { "External id": 12506,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295649902440.911, "dur": 10.817, "args": { "External id": 12507,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649902445.828, "dur": 5.494, "args": { "External id": 12508,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902449.591, "dur": 0.580, "args": { "External id": 12509,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649902458.436, "dur": 28.046, "args": { "External id": 12510,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902461.030, "dur": 0.442, "args": { "External id": 12511,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902463.081, "dur": 0.428, "args": { "External id": 12512,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902467.392, "dur": 0.388, "args": { "External id": 12513,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902468.918, "dur": 0.350, "args": { "External id": 12514,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902470.768, "dur": 2.605, "args": { "External id": 12515,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902474.810, "dur": 0.292, "args": { "External id": 12516,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902476.541, "dur": 0.341, "args": { "External id": 12517,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902480.846, "dur": 0.491, "args": { "External id": 12518,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649902482.742, "dur": 0.290, "args": { "External id": 12519,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649902497.191, "dur": 21.681, "args": { "External id": 12520,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6015 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295649902578.486, "dur": 282.976, "args": { "External id": 12521,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6016 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649902610.631, "dur": 246.182, "args": { "External id": 12522,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6017, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295649902620.571, "dur": 230.872, "args": { "External id": 12523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6018 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649902883.096, "dur": 2.232, "args": { "External id": 12524,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6019, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.0)", "pid": 1336754, "tid": 1336754, "ts": 1295649902963.351, "dur": 5881.913, "args": { "External id": 12525,"Record function id": 0, "Ev Idx": 6020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903097.842, "dur": 6.670, "args": { "External id": 12526,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903108.310, "dur": 0.989, "args": { "External id": 12527,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903111.019, "dur": 0.792, "args": { "External id": 12528,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903115.603, "dur": 2.056, "args": { "External id": 12529,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903118.979, "dur": 1.047, "args": { "External id": 12530,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903121.303, "dur": 0.573, "args": { "External id": 12531,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903124.460, "dur": 0.910, "args": { "External id": 12532,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903128.756, "dur": 1.768, "args": { "External id": 12533,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903132.559, "dur": 0.628, "args": { "External id": 12534,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649903134.690, "dur": 0.619, "args": { "External id": 12535,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6030 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649903154.114, "dur": 5655.996, "args": { "External id": 12536,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649903171.008, "dur": 5632.396, "args": { "External id": 12537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649903193.689, "dur": 13.248, "args": { "External id": 12538,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649903212.428, "dur": 5557.069, "args": { "External id": 12539,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649903214.884, "dur": 5554.066, "args": { "External id": 12540,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649903221.123, "dur": 5.802, "args": { "External id": 12541,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649903245.972, "dur": 5519.897, "args": { "External id": 12542,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6037 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649908978.729, "dur": 102.310, "args": { "External id": 12543,"Sequence number": 246541, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6038 } }, { "ph": "s", "id": 227, "pid": 1336754, "tid": 1336754, "ts": 1295649908978.729, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295649909068.395, "dur": 7.484, "args": { "External id": 12544,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649909071.143, "dur": 4.451, "args": { "External id": 12545,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6040 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295649909148.216, "dur": 103.120, "args": { "External id": 12546,"Record function id": 0, "Ev Idx": 6041 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295649909254.714, "dur": 1196.020, "args": { "External id": 12547,"Record function id": 0, "Ev Idx": 6042 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649909296.764, "dur": 1140.414, "args": { "External id": 12548,"Sequence number": 246542, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6043 } }, { "ph": "s", "id": 226, "pid": 1336754, "tid": 1336754, "ts": 1295649909296.764, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295649909369.791, "dur": 50.082, "args": { "External id": 12549,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649909432.812, "dur": 106.264, "args": { "External id": 12550,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649909550.688, "dur": 40.594, "args": { "External id": 12551,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649909599.473, "dur": 32.594, "args": { "External id": 12552,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6047 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649909657.158, "dur": 28.962, "args": { "External id": 12553,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6048 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649909705.699, "dur": 17.857, "args": { "External id": 12554,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6049 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295649909742.959, "dur": 129.029, "args": { "External id": 12555,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295649909796.371, "dur": 10.673, "args": { "External id": 12556,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649909801.425, "dur": 4.849, "args": { "External id": 12557,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649909810.001, "dur": 3.307, "args": { "External id": 12558,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649909814.777, "dur": 0.980, "args": { "External id": 12559,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649909818.050, "dur": 2.611, "args": { "External id": 12560,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649909882.085, "dur": 45.602, "args": { "External id": 12561,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6056 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295649909958.394, "dur": 114.481, "args": { "External id": 12562,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649910084.884, "dur": 49.288, "args": { "External id": 12563,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649910143.477, "dur": 35.568, "args": { "External id": 12564,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6059 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295649910202.569, "dur": 64.113, "args": { "External id": 12565,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649910274.394, "dur": 41.225, "args": { "External id": 12566,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6061 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295649910343.584, "dur": 19.648, "args": { "External id": 12567,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6062 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.0)", "pid": 1336754, "tid": 1336754, "ts": 1295649910516.188, "dur": 78.252, "args": { "External id": 12568,"Record function id": 0, "Ev Idx": 6063 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295649910665.905, "dur": 46.828, "args": { "External id": 12569,"Record function id": 0, "Ev Idx": 6064 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.1)", "pid": 1336754, "tid": 1336754, "ts": 1295649910721.816, "dur": 19376.493, "args": { "External id": 12570,"Record function id": 0, "Ev Idx": 6065 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.1)", "pid": 1336754, "tid": 1336754, "ts": 1295649910730.898, "dur": 966.973, "args": { "External id": 12571,"Record function id": 0, "Ev Idx": 6066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649910805.783, "dur": 8.498, "args": { "External id": 12572,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649910827.773, "dur": 33.791, "args": { "External id": 12573,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910832.802, "dur": 3.738, "args": { "External id": 12574,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910838.315, "dur": 0.645, "args": { "External id": 12575,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910840.181, "dur": 0.536, "args": { "External id": 12576,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910844.520, "dur": 0.180, "args": { "External id": 12577,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910845.613, "dur": 1.542, "args": { "External id": 12578,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910848.211, "dur": 0.193, "args": { "External id": 12579,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910850.281, "dur": 0.498, "args": { "External id": 12580,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910851.712, "dur": 0.310, "args": { "External id": 12581,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910852.932, "dur": 2.752, "args": { "External id": 12582,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649910871.787, "dur": 39.259, "args": { "External id": 12583,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6078 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295649910942.687, "dur": 181.441, "args": { "External id": 12584,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649910953.474, "dur": 3.599, "args": { "External id": 12585,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295649910962.429, "dur": 10.263, "args": { "External id": 12586,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649910967.161, "dur": 5.111, "args": { "External id": 12587,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910970.281, "dur": 0.623, "args": { "External id": 12588,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649910979.350, "dur": 90.122, "args": { "External id": 12589,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649910981.089, "dur": 61.721, "args": { "External id": 12590,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911046.281, "dur": 1.518, "args": { "External id": 12591,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911048.983, "dur": 3.291, "args": { "External id": 12592,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911053.343, "dur": 0.569, "args": { "External id": 12593,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911054.880, "dur": 0.370, "args": { "External id": 12594,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911058.551, "dur": 0.193, "args": { "External id": 12595,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911059.775, "dur": 0.305, "args": { "External id": 12596,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911061.013, "dur": 0.159, "args": { "External id": 12597,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911064.535, "dur": 0.151, "args": { "External id": 12598,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649911085.256, "dur": 28.611, "args": { "External id": 12599,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6094 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295649911179.838, "dur": 420.259, "args": { "External id": 12600,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6095 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649911265.367, "dur": 329.963, "args": { "External id": 12601,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6096, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295649911277.110, "dur": 312.841, "args": { "External id": 12602,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6097 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649911626.811, "dur": 2.330, "args": { "External id": 12603,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6098, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.1)", "pid": 1336754, "tid": 1336754, "ts": 1295649911718.643, "dur": 18156.503, "args": { "External id": 12604,"Record function id": 0, "Ev Idx": 6099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911811.296, "dur": 6.648, "args": { "External id": 12605,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911821.606, "dur": 0.998, "args": { "External id": 12606,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911824.408, "dur": 0.902, "args": { "External id": 12607,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911827.337, "dur": 0.828, "args": { "External id": 12608,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911829.459, "dur": 1.318, "args": { "External id": 12609,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911834.452, "dur": 0.705, "args": { "External id": 12610,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911836.742, "dur": 0.618, "args": { "External id": 12611,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911838.686, "dur": 3.188, "args": { "External id": 12612,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911843.888, "dur": 0.709, "args": { "External id": 12613,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649911848.578, "dur": 0.584, "args": { "External id": 12614,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6109 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649911867.553, "dur": 17969.210, "args": { "External id": 12615,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649911883.168, "dur": 17946.624, "args": { "External id": 12616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649911903.043, "dur": 14.199, "args": { "External id": 12617,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649911920.378, "dur": 17874.747, "args": { "External id": 12618,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649911922.988, "dur": 17871.397, "args": { "External id": 12619,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649911929.141, "dur": 5.149, "args": { "External id": 12620,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649911936.350, "dur": 17854.611, "args": { "External id": 12621,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6116 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649930033.091, "dur": 39.068, "args": { "External id": 12622,"Sequence number": 246543, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6117 } }, { "ph": "s", "id": 225, "pid": 1336754, "tid": 1336754, "ts": 1295649930033.091, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295649930058.212, "dur": 8.787, "args": { "External id": 12623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649930061.948, "dur": 4.703, "args": { "External id": 12624,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6119 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295649930139.606, "dur": 79.215, "args": { "External id": 12625,"Record function id": 0, "Ev Idx": 6120 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295649930220.471, "dur": 1127.358, "args": { "External id": 12626,"Record function id": 0, "Ev Idx": 6121 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649930279.687, "dur": 1054.440, "args": { "External id": 12627,"Sequence number": 246544, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6122 } }, { "ph": "s", "id": 224, "pid": 1336754, "tid": 1336754, "ts": 1295649930279.687, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295649930353.758, "dur": 48.189, "args": { "External id": 12628,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649930417.165, "dur": 105.304, "args": { "External id": 12629,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649930530.786, "dur": 38.978, "args": { "External id": 12630,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649930575.713, "dur": 31.000, "args": { "External id": 12631,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6126 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649930635.934, "dur": 28.804, "args": { "External id": 12632,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6127 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649930680.131, "dur": 19.498, "args": { "External id": 12633,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6128 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295649930714.216, "dur": 128.397, "args": { "External id": 12634,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295649930761.814, "dur": 12.624, "args": { "External id": 12635,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649930766.770, "dur": 6.931, "args": { "External id": 12636,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649930777.406, "dur": 4.668, "args": { "External id": 12637,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649930783.688, "dur": 3.096, "args": { "External id": 12638,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649930789.038, "dur": 3.186, "args": { "External id": 12639,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649930853.701, "dur": 46.804, "args": { "External id": 12640,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6135 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295649930930.939, "dur": 28.923, "args": { "External id": 12641,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649930968.332, "dur": 95.999, "args": { "External id": 12642,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649931074.693, "dur": 38.150, "args": { "External id": 12643,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6138 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295649931141.283, "dur": 27.409, "args": { "External id": 12644,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649931174.505, "dur": 35.165, "args": { "External id": 12645,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6140 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295649931243.189, "dur": 26.385, "args": { "External id": 12646,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6141 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.1)", "pid": 1336754, "tid": 1336754, "ts": 1295649931412.782, "dur": 73.659, "args": { "External id": 12647,"Record function id": 0, "Ev Idx": 6142 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295649931557.514, "dur": 45.719, "args": { "External id": 12648,"Record function id": 0, "Ev Idx": 6143 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.2)", "pid": 1336754, "tid": 1336754, "ts": 1295649931611.790, "dur": 18478.504, "args": { "External id": 12649,"Record function id": 0, "Ev Idx": 6144 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.2)", "pid": 1336754, "tid": 1336754, "ts": 1295649931620.402, "dur": 909.224, "args": { "External id": 12650,"Record function id": 0, "Ev Idx": 6145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649931695.711, "dur": 8.289, "args": { "External id": 12651,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649931717.861, "dur": 38.130, "args": { "External id": 12652,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931723.287, "dur": 2.303, "args": { "External id": 12653,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931729.999, "dur": 0.640, "args": { "External id": 12654,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931731.619, "dur": 0.653, "args": { "External id": 12655,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931733.669, "dur": 0.769, "args": { "External id": 12656,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931738.106, "dur": 0.669, "args": { "External id": 12657,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931739.881, "dur": 0.701, "args": { "External id": 12658,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931741.706, "dur": 4.520, "args": { "External id": 12659,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931747.456, "dur": 0.579, "args": { "External id": 12660,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931749.225, "dur": 0.515, "args": { "External id": 12661,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649931766.783, "dur": 38.248, "args": { "External id": 12662,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6157 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295649931836.626, "dur": 109.283, "args": { "External id": 12663,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649931849.365, "dur": 4.220, "args": { "External id": 12664,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295649931858.766, "dur": 10.247, "args": { "External id": 12665,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649931863.403, "dur": 5.197, "args": { "External id": 12666,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931867.032, "dur": 0.478, "args": { "External id": 12667,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649931875.978, "dur": 30.404, "args": { "External id": 12668,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931878.010, "dur": 3.241, "args": { "External id": 12669,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931882.525, "dur": 0.722, "args": { "External id": 12670,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931884.435, "dur": 0.845, "args": { "External id": 12671,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931889.127, "dur": 2.630, "args": { "External id": 12672,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931892.916, "dur": 0.727, "args": { "External id": 12673,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931895.057, "dur": 0.762, "args": { "External id": 12674,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931897.049, "dur": 0.584, "args": { "External id": 12675,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931898.689, "dur": 0.629, "args": { "External id": 12676,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649931900.484, "dur": 2.291, "args": { "External id": 12677,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649931917.019, "dur": 22.088, "args": { "External id": 12678,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6173 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295649932043.771, "dur": 385.137, "args": { "External id": 12679,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6174 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649932076.119, "dur": 347.653, "args": { "External id": 12680,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6175, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295649932089.429, "dur": 327.897, "args": { "External id": 12681,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6176 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649932456.029, "dur": 2.274, "args": { "External id": 12682,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6177, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.2)", "pid": 1336754, "tid": 1336754, "ts": 1295649932550.621, "dur": 17325.285, "args": { "External id": 12683,"Record function id": 0, "Ev Idx": 6178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932645.840, "dur": 7.011, "args": { "External id": 12684,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932657.033, "dur": 1.677, "args": { "External id": 12685,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932660.559, "dur": 2.001, "args": { "External id": 12686,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932664.161, "dur": 0.824, "args": { "External id": 12687,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932666.314, "dur": 1.028, "args": { "External id": 12688,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932668.591, "dur": 1.021, "args": { "External id": 12689,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932673.992, "dur": 0.975, "args": { "External id": 12690,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932676.945, "dur": 1.623, "args": { "External id": 12691,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932680.031, "dur": 0.716, "args": { "External id": 12692,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649932682.442, "dur": 0.849, "args": { "External id": 12693,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6188 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649932703.550, "dur": 17133.384, "args": { "External id": 12694,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649932719.849, "dur": 17110.399, "args": { "External id": 12695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649932740.183, "dur": 13.390, "args": { "External id": 12696,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649932756.773, "dur": 17038.556, "args": { "External id": 12697,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649932759.500, "dur": 17035.302, "args": { "External id": 12698,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649932765.363, "dur": 5.209, "args": { "External id": 12699,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649932772.359, "dur": 17019.219, "args": { "External id": 12700,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6195 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649950027.364, "dur": 36.419, "args": { "External id": 12701,"Sequence number": 246545, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6196 } }, { "ph": "s", "id": 223, "pid": 1336754, "tid": 1336754, "ts": 1295649950027.364, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295649950051.224, "dur": 7.596, "args": { "External id": 12702,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649950054.086, "dur": 4.421, "args": { "External id": 12703,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6198 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295649950132.159, "dur": 78.212, "args": { "External id": 12704,"Record function id": 0, "Ev Idx": 6199 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295649950212.170, "dur": 1111.485, "args": { "External id": 12705,"Record function id": 0, "Ev Idx": 6200 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295649950268.990, "dur": 1040.002, "args": { "External id": 12706,"Sequence number": 246546, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6201 } }, { "ph": "s", "id": 222, "pid": 1336754, "tid": 1336754, "ts": 1295649950268.990, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295649950339.000, "dur": 45.226, "args": { "External id": 12707,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649950396.317, "dur": 105.457, "args": { "External id": 12708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649950511.878, "dur": 39.786, "args": { "External id": 12709,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649950561.190, "dur": 31.816, "args": { "External id": 12710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6205 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649950620.270, "dur": 26.098, "args": { "External id": 12711,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6206 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295649950665.319, "dur": 18.739, "args": { "External id": 12712,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6207 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295649950702.564, "dur": 128.727, "args": { "External id": 12713,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295649950752.982, "dur": 10.927, "args": { "External id": 12714,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649950757.783, "dur": 5.456, "args": { "External id": 12715,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649950766.471, "dur": 5.411, "args": { "External id": 12716,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649950773.476, "dur": 1.426, "args": { "External id": 12717,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649950777.081, "dur": 4.021, "args": { "External id": 12718,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649950841.812, "dur": 45.708, "args": { "External id": 12719,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6214 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295649950918.502, "dur": 29.382, "args": { "External id": 12720,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649950957.505, "dur": 82.765, "args": { "External id": 12721,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649951053.085, "dur": 38.648, "args": { "External id": 12722,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6217 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295649951116.318, "dur": 26.466, "args": { "External id": 12723,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295649951148.399, "dur": 34.490, "args": { "External id": 12724,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6219 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295649951205.373, "dur": 18.774, "args": { "External id": 12725,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6220 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.2)", "pid": 1336754, "tid": 1336754, "ts": 1295649951387.447, "dur": 74.740, "args": { "External id": 12726,"Record function id": 0, "Ev Idx": 6221 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295649951535.043, "dur": 46.434, "args": { "External id": 12727,"Record function id": 0, "Ev Idx": 6222 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.3)", "pid": 1336754, "tid": 1336754, "ts": 1295649951590.459, "dur": 85236.759, "args": { "External id": 12728,"Record function id": 0, "Ev Idx": 6223 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.3)", "pid": 1336754, "tid": 1336754, "ts": 1295649951600.261, "dur": 960.524, "args": { "External id": 12729,"Record function id": 0, "Ev Idx": 6224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649951676.591, "dur": 8.655, "args": { "External id": 12730,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649951698.795, "dur": 41.539, "args": { "External id": 12731,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951704.489, "dur": 2.073, "args": { "External id": 12732,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951711.503, "dur": 0.439, "args": { "External id": 12733,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951713.543, "dur": 0.540, "args": { "External id": 12734,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951720.595, "dur": 0.394, "args": { "External id": 12735,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951724.388, "dur": 0.581, "args": { "External id": 12736,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951726.543, "dur": 0.664, "args": { "External id": 12737,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951728.878, "dur": 2.953, "args": { "External id": 12738,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951733.108, "dur": 0.172, "args": { "External id": 12739,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951734.661, "dur": 0.275, "args": { "External id": 12740,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649951751.738, "dur": 42.398, "args": { "External id": 12741,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6236 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295649951826.235, "dur": 116.628, "args": { "External id": 12742,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649951837.278, "dur": 3.331, "args": { "External id": 12743,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295649951845.470, "dur": 10.103, "args": { "External id": 12744,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295649951850.229, "dur": 4.916, "args": { "External id": 12745,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951853.361, "dur": 0.646, "args": { "External id": 12746,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295649951862.387, "dur": 30.104, "args": { "External id": 12747,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951864.168, "dur": 2.506, "args": { "External id": 12748,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951868.024, "dur": 0.399, "args": { "External id": 12749,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951869.971, "dur": 0.325, "args": { "External id": 12750,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951873.640, "dur": 1.457, "args": { "External id": 12751,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951876.748, "dur": 0.331, "args": { "External id": 12752,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951878.664, "dur": 0.478, "args": { "External id": 12753,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951882.946, "dur": 0.326, "args": { "External id": 12754,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951884.455, "dur": 0.158, "args": { "External id": 12755,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649951886.214, "dur": 2.565, "args": { "External id": 12756,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649951914.008, "dur": 21.614, "args": { "External id": 12757,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6252 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295649952040.643, "dur": 417.600, "args": { "External id": 12758,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6253 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649952072.591, "dur": 379.980, "args": { "External id": 12759,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6254, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295649952088.071, "dur": 358.309, "args": { "External id": 12760,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6255 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295649952484.984, "dur": 2.546, "args": { "External id": 12761,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6256, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.3)", "pid": 1336754, "tid": 1336754, "ts": 1295649952582.153, "dur": 84041.099, "args": { "External id": 12762,"Record function id": 0, "Ev Idx": 6257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952674.015, "dur": 6.665, "args": { "External id": 12763,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952683.872, "dur": 1.412, "args": { "External id": 12764,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952687.074, "dur": 2.035, "args": { "External id": 12765,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952691.253, "dur": 0.880, "args": { "External id": 12766,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952693.404, "dur": 1.148, "args": { "External id": 12767,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952695.873, "dur": 0.843, "args": { "External id": 12768,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952701.027, "dur": 0.922, "args": { "External id": 12769,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952703.692, "dur": 2.048, "args": { "External id": 12770,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952707.143, "dur": 0.474, "args": { "External id": 12771,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295649952709.529, "dur": 0.587, "args": { "External id": 12772,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6267 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649952730.790, "dur": 83849.656, "args": { "External id": 12773,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649952747.247, "dur": 83825.706, "args": { "External id": 12774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295649952766.358, "dur": 15.493, "args": { "External id": 12775,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295649952785.013, "dur": 83749.802, "args": { "External id": 12776,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295649952787.802, "dur": 83746.361, "args": { "External id": 12777,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295649952794.096, "dur": 5.872, "args": { "External id": 12778,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295649952801.786, "dur": 83728.874, "args": { "External id": 12779,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6274 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650036755.013, "dur": 47.726, "args": { "External id": 12780,"Sequence number": 246547, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6275 } }, { "ph": "s", "id": 221, "pid": 1336754, "tid": 1336754, "ts": 1295650036755.013, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650036789.788, "dur": 8.010, "args": { "External id": 12781,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650036793.127, "dur": 4.500, "args": { "External id": 12782,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6277 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650036867.913, "dur": 82.264, "args": { "External id": 12783,"Record function id": 0, "Ev Idx": 6278 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650036951.854, "dur": 1160.539, "args": { "External id": 12784,"Record function id": 0, "Ev Idx": 6279 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650037022.492, "dur": 1076.069, "args": { "External id": 12785,"Sequence number": 246548, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6280 } }, { "ph": "s", "id": 220, "pid": 1336754, "tid": 1336754, "ts": 1295650037022.492, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650037092.970, "dur": 47.309, "args": { "External id": 12786,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037152.442, "dur": 109.731, "args": { "External id": 12787,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037277.392, "dur": 43.479, "args": { "External id": 12788,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037328.064, "dur": 31.530, "args": { "External id": 12789,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6284 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650037392.132, "dur": 30.585, "args": { "External id": 12790,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6285 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650037439.529, "dur": 15.831, "args": { "External id": 12791,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6286 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650037474.496, "dur": 132.315, "args": { "External id": 12792,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650037524.616, "dur": 11.862, "args": { "External id": 12793,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650037529.556, "dur": 6.190, "args": { "External id": 12794,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650037539.237, "dur": 5.733, "args": { "External id": 12795,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650037546.294, "dur": 1.571, "args": { "External id": 12796,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650037552.748, "dur": 4.423, "args": { "External id": 12797,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037617.500, "dur": 50.769, "args": { "External id": 12798,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6293 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650037699.803, "dur": 31.126, "args": { "External id": 12799,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037740.724, "dur": 43.162, "args": { "External id": 12800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037819.540, "dur": 36.524, "args": { "External id": 12801,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6296 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650037883.630, "dur": 25.495, "args": { "External id": 12802,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650037914.653, "dur": 36.477, "args": { "External id": 12803,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6298 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650037969.664, "dur": 58.960, "args": { "External id": 12804,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6299 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.3)", "pid": 1336754, "tid": 1336754, "ts": 1295650038178.096, "dur": 95.504, "args": { "External id": 12805,"Record function id": 0, "Ev Idx": 6300 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650038349.419, "dur": 46.718, "args": { "External id": 12806,"Record function id": 0, "Ev Idx": 6301 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.4)", "pid": 1336754, "tid": 1336754, "ts": 1295650038404.425, "dur": 19259.059, "args": { "External id": 12807,"Record function id": 0, "Ev Idx": 6302 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.4)", "pid": 1336754, "tid": 1336754, "ts": 1295650038413.949, "dur": 907.237, "args": { "External id": 12808,"Record function id": 0, "Ev Idx": 6303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650038491.197, "dur": 9.337, "args": { "External id": 12809,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650038514.765, "dur": 37.614, "args": { "External id": 12810,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038520.428, "dur": 2.415, "args": { "External id": 12811,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038528.183, "dur": 0.460, "args": { "External id": 12812,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038529.890, "dur": 0.187, "args": { "External id": 12813,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038531.542, "dur": 0.625, "args": { "External id": 12814,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038535.229, "dur": 0.430, "args": { "External id": 12815,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038537.180, "dur": 0.552, "args": { "External id": 12816,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038538.769, "dur": 3.985, "args": { "External id": 12817,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038544.260, "dur": 0.630, "args": { "External id": 12818,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038545.668, "dur": 0.494, "args": { "External id": 12819,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650038563.133, "dur": 43.127, "args": { "External id": 12820,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6315 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650038637.979, "dur": 106.998, "args": { "External id": 12821,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650038648.256, "dur": 4.595, "args": { "External id": 12822,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650038657.782, "dur": 10.137, "args": { "External id": 12823,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650038662.375, "dur": 5.159, "args": { "External id": 12824,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038665.800, "dur": 0.552, "args": { "External id": 12825,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650038674.174, "dur": 30.166, "args": { "External id": 12826,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038676.150, "dur": 2.696, "args": { "External id": 12827,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038680.381, "dur": 0.643, "args": { "External id": 12828,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038682.214, "dur": 0.211, "args": { "External id": 12829,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038686.607, "dur": 2.066, "args": { "External id": 12830,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038690.102, "dur": 0.348, "args": { "External id": 12831,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038692.275, "dur": 0.344, "args": { "External id": 12832,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038694.064, "dur": 0.347, "args": { "External id": 12833,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038696.017, "dur": 0.194, "args": { "External id": 12834,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650038697.500, "dur": 2.506, "args": { "External id": 12835,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650038715.188, "dur": 21.797, "args": { "External id": 12836,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6331 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650038798.116, "dur": 405.116, "args": { "External id": 12837,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6332 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650038829.622, "dur": 368.138, "args": { "External id": 12838,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6333, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650038841.917, "dur": 349.275, "args": { "External id": 12839,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6334 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650039245.627, "dur": 3.243, "args": { "External id": 12840,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6335, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.4)", "pid": 1336754, "tid": 1336754, "ts": 1295650039342.318, "dur": 18129.413, "args": { "External id": 12841,"Record function id": 0, "Ev Idx": 6336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039441.702, "dur": 6.711, "args": { "External id": 12842,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039451.933, "dur": 1.068, "args": { "External id": 12843,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039454.778, "dur": 2.144, "args": { "External id": 12844,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039458.823, "dur": 0.855, "args": { "External id": 12845,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039461.018, "dur": 1.158, "args": { "External id": 12846,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039463.498, "dur": 0.597, "args": { "External id": 12847,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039468.230, "dur": 1.073, "args": { "External id": 12848,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039471.008, "dur": 2.166, "args": { "External id": 12849,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039474.488, "dur": 0.754, "args": { "External id": 12850,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650039477.144, "dur": 0.700, "args": { "External id": 12851,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6346 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650039498.095, "dur": 17935.045, "args": { "External id": 12852,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650039514.556, "dur": 17911.845, "args": { "External id": 12853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650039537.502, "dur": 14.508, "args": { "External id": 12854,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650039555.246, "dur": 17836.521, "args": { "External id": 12855,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650039557.722, "dur": 17833.401, "args": { "External id": 12856,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650039563.963, "dur": 5.489, "args": { "External id": 12857,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650039571.243, "dur": 17816.545, "args": { "External id": 12858,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6353 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650057601.341, "dur": 36.415, "args": { "External id": 12859,"Sequence number": 246549, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6354 } }, { "ph": "s", "id": 219, "pid": 1336754, "tid": 1336754, "ts": 1295650057601.341, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650057624.570, "dur": 8.019, "args": { "External id": 12860,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650057628.060, "dur": 4.309, "args": { "External id": 12861,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6356 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650057704.391, "dur": 74.631, "args": { "External id": 12862,"Record function id": 0, "Ev Idx": 6357 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650057780.790, "dur": 1086.887, "args": { "External id": 12863,"Record function id": 0, "Ev Idx": 6358 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650057820.897, "dur": 1033.719, "args": { "External id": 12864,"Sequence number": 246550, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6359 } }, { "ph": "s", "id": 218, "pid": 1336754, "tid": 1336754, "ts": 1295650057820.897, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650057886.208, "dur": 42.172, "args": { "External id": 12865,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650057941.491, "dur": 132.626, "args": { "External id": 12866,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058088.672, "dur": 42.306, "args": { "External id": 12867,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058140.786, "dur": 31.137, "args": { "External id": 12868,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6363 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650058199.385, "dur": 41.877, "args": { "External id": 12869,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6364 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650058263.761, "dur": 18.705, "args": { "External id": 12870,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6365 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650058301.018, "dur": 134.382, "args": { "External id": 12871,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650058353.181, "dur": 12.261, "args": { "External id": 12872,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650058358.096, "dur": 6.452, "args": { "External id": 12873,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650058368.331, "dur": 5.932, "args": { "External id": 12874,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650058375.953, "dur": 1.308, "args": { "External id": 12875,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650058379.861, "dur": 4.373, "args": { "External id": 12876,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058445.788, "dur": 51.893, "args": { "External id": 12877,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6372 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650058530.160, "dur": 28.324, "args": { "External id": 12878,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058567.672, "dur": 41.649, "args": { "External id": 12879,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058618.051, "dur": 34.361, "args": { "External id": 12880,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6375 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650058677.234, "dur": 28.002, "args": { "External id": 12881,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650058711.077, "dur": 34.360, "args": { "External id": 12882,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6377 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650058766.583, "dur": 18.728, "args": { "External id": 12883,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6378 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.4)", "pid": 1336754, "tid": 1336754, "ts": 1295650058929.711, "dur": 117.085, "args": { "External id": 12884,"Record function id": 0, "Ev Idx": 6379 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650059126.746, "dur": 48.003, "args": { "External id": 12885,"Record function id": 0, "Ev Idx": 6380 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.5)", "pid": 1336754, "tid": 1336754, "ts": 1295650059184.121, "dur": 18993.401, "args": { "External id": 12886,"Record function id": 0, "Ev Idx": 6381 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.5)", "pid": 1336754, "tid": 1336754, "ts": 1295650059194.102, "dur": 911.513, "args": { "External id": 12887,"Record function id": 0, "Ev Idx": 6382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650059290.367, "dur": 9.568, "args": { "External id": 12888,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650059314.826, "dur": 39.793, "args": { "External id": 12889,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059320.928, "dur": 2.448, "args": { "External id": 12890,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059328.346, "dur": 0.253, "args": { "External id": 12891,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059330.374, "dur": 0.469, "args": { "External id": 12892,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059332.261, "dur": 0.692, "args": { "External id": 12893,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059336.484, "dur": 0.236, "args": { "External id": 12894,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059337.905, "dur": 0.842, "args": { "External id": 12895,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059340.028, "dur": 3.735, "args": { "External id": 12896,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059345.063, "dur": 0.397, "args": { "External id": 12897,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059347.528, "dur": 0.550, "args": { "External id": 12898,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650059366.170, "dur": 41.915, "args": { "External id": 12899,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6394 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650059441.672, "dur": 113.230, "args": { "External id": 12900,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650059452.435, "dur": 4.118, "args": { "External id": 12901,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650059461.602, "dur": 9.987, "args": { "External id": 12902,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650059466.105, "dur": 5.062, "args": { "External id": 12903,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059469.440, "dur": 0.627, "args": { "External id": 12904,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650059478.669, "dur": 32.506, "args": { "External id": 12905,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059480.713, "dur": 3.152, "args": { "External id": 12906,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059485.445, "dur": 0.334, "args": { "External id": 12907,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059487.797, "dur": 0.460, "args": { "External id": 12908,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059492.140, "dur": 1.989, "args": { "External id": 12909,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059495.691, "dur": 0.362, "args": { "External id": 12910,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059497.408, "dur": 0.355, "args": { "External id": 12911,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059501.941, "dur": 0.162, "args": { "External id": 12912,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059503.286, "dur": 0.161, "args": { "External id": 12913,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650059505.165, "dur": 2.345, "args": { "External id": 12914,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650059524.729, "dur": 22.663, "args": { "External id": 12915,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6410 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650059610.244, "dur": 357.586, "args": { "External id": 12916,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6411 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650059641.800, "dur": 321.283, "args": { "External id": 12917,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6412, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650059654.693, "dur": 300.289, "args": { "External id": 12918,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6413 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650060029.775, "dur": 3.605, "args": { "External id": 12919,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6414, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.5)", "pid": 1336754, "tid": 1336754, "ts": 1295650060126.572, "dur": 17816.676, "args": { "External id": 12920,"Record function id": 0, "Ev Idx": 6415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060225.101, "dur": 21.550, "args": { "External id": 12921,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060252.650, "dur": 1.204, "args": { "External id": 12922,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060255.794, "dur": 2.696, "args": { "External id": 12923,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060260.271, "dur": 0.993, "args": { "External id": 12924,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060262.514, "dur": 0.954, "args": { "External id": 12925,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060265.192, "dur": 0.766, "args": { "External id": 12926,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060269.655, "dur": 0.775, "args": { "External id": 12927,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060272.123, "dur": 2.136, "args": { "External id": 12928,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060275.543, "dur": 0.668, "args": { "External id": 12929,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650060277.779, "dur": 0.455, "args": { "External id": 12930,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6425 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650060299.753, "dur": 17604.114, "args": { "External id": 12931,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650060323.138, "dur": 17573.996, "args": { "External id": 12932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650060342.679, "dur": 14.705, "args": { "External id": 12933,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650060360.622, "dur": 17501.520, "args": { "External id": 12934,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650060363.233, "dur": 17498.273, "args": { "External id": 12935,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650060369.651, "dur": 6.170, "args": { "External id": 12936,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650060377.844, "dur": 17480.562, "args": { "External id": 12937,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6432 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650078113.493, "dur": 37.750, "args": { "External id": 12938,"Sequence number": 246551, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6433 } }, { "ph": "s", "id": 217, "pid": 1336754, "tid": 1336754, "ts": 1295650078113.493, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650078137.787, "dur": 8.597, "args": { "External id": 12939,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650078141.603, "dur": 4.488, "args": { "External id": 12940,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6435 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650078217.377, "dur": 90.418, "args": { "External id": 12941,"Record function id": 0, "Ev Idx": 6436 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650078310.707, "dur": 1127.837, "args": { "External id": 12942,"Record function id": 0, "Ev Idx": 6437 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650078353.731, "dur": 1071.040, "args": { "External id": 12943,"Sequence number": 246552, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6438 } }, { "ph": "s", "id": 216, "pid": 1336754, "tid": 1336754, "ts": 1295650078353.731, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650078423.892, "dur": 47.201, "args": { "External id": 12944,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650078484.265, "dur": 105.206, "args": { "External id": 12945,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650078600.224, "dur": 39.788, "args": { "External id": 12946,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650078649.395, "dur": 31.665, "args": { "External id": 12947,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6442 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650078707.408, "dur": 27.395, "args": { "External id": 12948,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6443 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650078753.807, "dur": 15.348, "args": { "External id": 12949,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6444 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650078791.725, "dur": 127.380, "args": { "External id": 12950,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650078840.526, "dur": 12.058, "args": { "External id": 12951,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650078845.713, "dur": 6.177, "args": { "External id": 12952,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650078855.279, "dur": 6.002, "args": { "External id": 12953,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650078863.058, "dur": 1.291, "args": { "External id": 12954,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650078866.546, "dur": 4.366, "args": { "External id": 12955,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650078929.728, "dur": 47.980, "args": { "External id": 12956,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6451 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650079055.780, "dur": 34.012, "args": { "External id": 12957,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650079100.307, "dur": 46.085, "args": { "External id": 12958,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650079156.264, "dur": 34.901, "args": { "External id": 12959,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6454 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650079214.053, "dur": 42.435, "args": { "External id": 12960,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650079263.977, "dur": 46.056, "args": { "External id": 12961,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6456 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650079334.871, "dur": 22.018, "args": { "External id": 12962,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6457 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.5)", "pid": 1336754, "tid": 1336754, "ts": 1295650079503.388, "dur": 73.870, "args": { "External id": 12963,"Record function id": 0, "Ev Idx": 6458 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650079650.807, "dur": 44.895, "args": { "External id": 12964,"Record function id": 0, "Ev Idx": 6459 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.6)", "pid": 1336754, "tid": 1336754, "ts": 1295650079704.524, "dur": 18833.642, "args": { "External id": 12965,"Record function id": 0, "Ev Idx": 6460 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.6)", "pid": 1336754, "tid": 1336754, "ts": 1295650079712.414, "dur": 902.352, "args": { "External id": 12966,"Record function id": 0, "Ev Idx": 6461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650079792.141, "dur": 8.342, "args": { "External id": 12967,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650079814.319, "dur": 38.930, "args": { "External id": 12968,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079820.354, "dur": 2.455, "args": { "External id": 12969,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079827.092, "dur": 0.433, "args": { "External id": 12970,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079829.592, "dur": 0.544, "args": { "External id": 12971,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079831.545, "dur": 0.324, "args": { "External id": 12972,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079835.433, "dur": 0.368, "args": { "External id": 12973,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079837.164, "dur": 0.373, "args": { "External id": 12974,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079839.169, "dur": 4.066, "args": { "External id": 12975,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079844.735, "dur": 0.433, "args": { "External id": 12976,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079846.900, "dur": 0.215, "args": { "External id": 12977,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650079864.834, "dur": 38.638, "args": { "External id": 12978,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6473 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650079934.203, "dur": 157.861, "args": { "External id": 12979,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650079945.191, "dur": 4.491, "args": { "External id": 12980,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650079954.625, "dur": 10.805, "args": { "External id": 12981,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650079959.220, "dur": 5.788, "args": { "External id": 12982,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079963.001, "dur": 0.770, "args": { "External id": 12983,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650079972.366, "dur": 73.816, "args": { "External id": 12984,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079974.571, "dur": 2.726, "args": { "External id": 12985,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650079978.818, "dur": 0.422, "args": { "External id": 12986,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080021.342, "dur": 0.825, "args": { "External id": 12987,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080027.171, "dur": 1.559, "args": { "External id": 12988,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080030.065, "dur": 0.401, "args": { "External id": 12989,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080032.312, "dur": 0.181, "args": { "External id": 12990,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080035.517, "dur": 0.397, "args": { "External id": 12991,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080037.757, "dur": 0.369, "args": { "External id": 12992,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080039.471, "dur": 2.019, "args": { "External id": 12993,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650080058.142, "dur": 25.792, "args": { "External id": 12994,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6489 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650080149.504, "dur": 368.125, "args": { "External id": 12995,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6490 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650080181.150, "dur": 331.512, "args": { "External id": 12996,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6491, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650080192.369, "dur": 314.127, "args": { "External id": 12997,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6492 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650080543.317, "dur": 2.506, "args": { "External id": 12998,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6493, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.6)", "pid": 1336754, "tid": 1336754, "ts": 1295650080636.749, "dur": 17713.876, "args": { "External id": 12999,"Record function id": 0, "Ev Idx": 6494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080732.898, "dur": 6.567, "args": { "External id": 13000,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080742.802, "dur": 0.959, "args": { "External id": 13001,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080745.538, "dur": 2.327, "args": { "External id": 13002,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080749.638, "dur": 0.685, "args": { "External id": 13003,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080751.958, "dur": 0.565, "args": { "External id": 13004,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080753.651, "dur": 0.930, "args": { "External id": 13005,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080758.523, "dur": 0.803, "args": { "External id": 13006,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080760.849, "dur": 2.212, "args": { "External id": 13007,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080764.575, "dur": 0.844, "args": { "External id": 13008,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650080766.570, "dur": 0.679, "args": { "External id": 13009,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6504 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650080785.941, "dur": 17525.050, "args": { "External id": 13010,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650080802.080, "dur": 17502.030, "args": { "External id": 13011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650080823.920, "dur": 15.585, "args": { "External id": 13012,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650080842.700, "dur": 17427.312, "args": { "External id": 13013,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650080845.344, "dur": 17424.075, "args": { "External id": 13014,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650080851.666, "dur": 6.179, "args": { "External id": 13015,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650080859.749, "dur": 17406.442, "args": { "External id": 13016,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6511 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650098478.275, "dur": 36.139, "args": { "External id": 13017,"Sequence number": 246553, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6512 } }, { "ph": "s", "id": 215, "pid": 1336754, "tid": 1336754, "ts": 1295650098478.275, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650098501.381, "dur": 7.360, "args": { "External id": 13018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650098504.379, "dur": 4.145, "args": { "External id": 13019,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6514 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650098580.644, "dur": 79.662, "args": { "External id": 13020,"Record function id": 0, "Ev Idx": 6515 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650098661.920, "dur": 1124.096, "args": { "External id": 13021,"Record function id": 0, "Ev Idx": 6516 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650098702.915, "dur": 1069.078, "args": { "External id": 13022,"Sequence number": 246554, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6517 } }, { "ph": "s", "id": 214, "pid": 1336754, "tid": 1336754, "ts": 1295650098702.915, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650098769.300, "dur": 43.773, "args": { "External id": 13023,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650098825.659, "dur": 105.870, "args": { "External id": 13024,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650098941.891, "dur": 38.992, "args": { "External id": 13025,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650099032.149, "dur": 38.267, "args": { "External id": 13026,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6521 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650099099.033, "dur": 28.745, "args": { "External id": 13027,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6522 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650099147.039, "dur": 16.267, "args": { "External id": 13028,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6523 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650099182.922, "dur": 152.451, "args": { "External id": 13029,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650099249.280, "dur": 12.027, "args": { "External id": 13030,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650099253.904, "dur": 6.549, "args": { "External id": 13031,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650099264.357, "dur": 5.504, "args": { "External id": 13032,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650099271.234, "dur": 1.328, "args": { "External id": 13033,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650099275.757, "dur": 5.019, "args": { "External id": 13034,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650099346.590, "dur": 52.802, "args": { "External id": 13035,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6530 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650099432.796, "dur": 30.938, "args": { "External id": 13036,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650099473.625, "dur": 43.171, "args": { "External id": 13037,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650099525.865, "dur": 35.442, "args": { "External id": 13038,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6533 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650099585.647, "dur": 28.270, "args": { "External id": 13039,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650099620.205, "dur": 33.548, "args": { "External id": 13040,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6535 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650099676.101, "dur": 24.791, "args": { "External id": 13041,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6536 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.6)", "pid": 1336754, "tid": 1336754, "ts": 1295650099849.164, "dur": 72.331, "args": { "External id": 13042,"Record function id": 0, "Ev Idx": 6537 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650100035.760, "dur": 52.264, "args": { "External id": 13043,"Record function id": 0, "Ev Idx": 6538 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.7)", "pid": 1336754, "tid": 1336754, "ts": 1295650100096.988, "dur": 18650.516, "args": { "External id": 13044,"Record function id": 0, "Ev Idx": 6539 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.7)", "pid": 1336754, "tid": 1336754, "ts": 1295650100107.086, "dur": 855.087, "args": { "External id": 13045,"Record function id": 0, "Ev Idx": 6540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650100188.265, "dur": 10.037, "args": { "External id": 13046,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650100212.659, "dur": 52.704, "args": { "External id": 13047,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100218.274, "dur": 2.359, "args": { "External id": 13048,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100225.032, "dur": 0.204, "args": { "External id": 13049,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100226.638, "dur": 14.172, "args": { "External id": 13050,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100243.928, "dur": 0.387, "args": { "External id": 13051,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100248.001, "dur": 0.224, "args": { "External id": 13052,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100249.632, "dur": 0.429, "args": { "External id": 13053,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100251.114, "dur": 4.060, "args": { "External id": 13054,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100256.801, "dur": 0.426, "args": { "External id": 13055,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100258.777, "dur": 0.365, "args": { "External id": 13056,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650100278.228, "dur": 44.402, "args": { "External id": 13057,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6552 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650100357.472, "dur": 110.823, "args": { "External id": 13058,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650100369.064, "dur": 4.850, "args": { "External id": 13059,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650100379.193, "dur": 10.374, "args": { "External id": 13060,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650100383.830, "dur": 5.337, "args": { "External id": 13061,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100387.124, "dur": 0.864, "args": { "External id": 13062,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650100396.971, "dur": 29.873, "args": { "External id": 13063,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100399.018, "dur": 2.853, "args": { "External id": 13064,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100403.264, "dur": 0.383, "args": { "External id": 13065,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100404.706, "dur": 0.215, "args": { "External id": 13066,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100409.467, "dur": 1.263, "args": { "External id": 13067,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100411.926, "dur": 0.296, "args": { "External id": 13068,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100413.765, "dur": 0.308, "args": { "External id": 13069,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100417.069, "dur": 0.160, "args": { "External id": 13070,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100418.668, "dur": 0.158, "args": { "External id": 13071,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650100420.208, "dur": 2.532, "args": { "External id": 13072,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650100439.371, "dur": 21.439, "args": { "External id": 13073,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6568 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650100522.061, "dur": 352.965, "args": { "External id": 13074,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6569 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650100552.962, "dur": 317.515, "args": { "External id": 13075,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6570, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650100564.602, "dur": 300.364, "args": { "External id": 13076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6571 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650100898.948, "dur": 2.316, "args": { "External id": 13077,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6572, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.7)", "pid": 1336754, "tid": 1336754, "ts": 1295650101021.611, "dur": 17530.705, "args": { "External id": 13078,"Record function id": 0, "Ev Idx": 6573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101133.879, "dur": 6.781, "args": { "External id": 13079,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101144.801, "dur": 1.006, "args": { "External id": 13080,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101147.579, "dur": 2.065, "args": { "External id": 13081,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101153.245, "dur": 0.910, "args": { "External id": 13082,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101155.346, "dur": 0.861, "args": { "External id": 13083,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101157.448, "dur": 0.711, "args": { "External id": 13084,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101159.918, "dur": 0.885, "args": { "External id": 13085,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101164.787, "dur": 2.083, "args": { "External id": 13086,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101168.334, "dur": 0.466, "args": { "External id": 13087,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650101170.443, "dur": 0.776, "args": { "External id": 13088,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6583 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650101190.637, "dur": 17321.305, "args": { "External id": 13089,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650101206.285, "dur": 17298.509, "args": { "External id": 13090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650101226.215, "dur": 29.795, "args": { "External id": 13091,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650101262.644, "dur": 17206.893, "args": { "External id": 13092,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650101265.257, "dur": 17203.671, "args": { "External id": 13093,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650101271.286, "dur": 6.123, "args": { "External id": 13094,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650101279.281, "dur": 17186.412, "args": { "External id": 13095,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6590 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650118683.868, "dur": 39.874, "args": { "External id": 13096,"Sequence number": 246555, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6591 } }, { "ph": "s", "id": 213, "pid": 1336754, "tid": 1336754, "ts": 1295650118683.868, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650118711.455, "dur": 7.295, "args": { "External id": 13097,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650118714.279, "dur": 4.218, "args": { "External id": 13098,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6593 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650118788.433, "dur": 75.932, "args": { "External id": 13099,"Record function id": 0, "Ev Idx": 6594 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650118865.949, "dur": 1107.102, "args": { "External id": 13100,"Record function id": 0, "Ev Idx": 6595 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650118907.080, "dur": 1052.865, "args": { "External id": 13101,"Sequence number": 246556, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6596 } }, { "ph": "s", "id": 212, "pid": 1336754, "tid": 1336754, "ts": 1295650118907.080, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650118977.178, "dur": 77.498, "args": { "External id": 13102,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119071.294, "dur": 104.175, "args": { "External id": 13103,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119186.316, "dur": 54.458, "args": { "External id": 13104,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119254.268, "dur": 35.980, "args": { "External id": 13105,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6600 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650119318.153, "dur": 29.511, "args": { "External id": 13106,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6601 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650119365.469, "dur": 16.063, "args": { "External id": 13107,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6602 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650119400.160, "dur": 138.991, "args": { "External id": 13108,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650119452.916, "dur": 11.621, "args": { "External id": 13109,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650119457.956, "dur": 5.778, "args": { "External id": 13110,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650119467.300, "dur": 6.233, "args": { "External id": 13111,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650119480.885, "dur": 1.232, "args": { "External id": 13112,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650119484.656, "dur": 4.336, "args": { "External id": 13113,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119549.622, "dur": 52.191, "args": { "External id": 13114,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6609 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650119634.986, "dur": 27.860, "args": { "External id": 13115,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119672.423, "dur": 42.708, "args": { "External id": 13116,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119724.194, "dur": 36.062, "args": { "External id": 13117,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6612 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650119782.784, "dur": 25.922, "args": { "External id": 13118,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650119814.455, "dur": 34.825, "args": { "External id": 13119,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6614 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650119872.057, "dur": 19.086, "args": { "External id": 13120,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6615 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.7)", "pid": 1336754, "tid": 1336754, "ts": 1295650120077.404, "dur": 75.982, "args": { "External id": 13121,"Record function id": 0, "Ev Idx": 6616 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650120226.652, "dur": 67.726, "args": { "External id": 13122,"Record function id": 0, "Ev Idx": 6617 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.8)", "pid": 1336754, "tid": 1336754, "ts": 1295650120304.576, "dur": 18812.642, "args": { "External id": 13123,"Record function id": 0, "Ev Idx": 6618 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.8)", "pid": 1336754, "tid": 1336754, "ts": 1295650120315.945, "dur": 824.248, "args": { "External id": 13124,"Record function id": 0, "Ev Idx": 6619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650120399.812, "dur": 8.609, "args": { "External id": 13125,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650120423.161, "dur": 35.805, "args": { "External id": 13126,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120428.761, "dur": 2.238, "args": { "External id": 13127,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120435.835, "dur": 0.451, "args": { "External id": 13128,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120437.407, "dur": 0.198, "args": { "External id": 13129,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120439.153, "dur": 0.415, "args": { "External id": 13130,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120442.277, "dur": 0.451, "args": { "External id": 13131,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120444.276, "dur": 0.476, "args": { "External id": 13132,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120445.713, "dur": 3.837, "args": { "External id": 13133,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120450.986, "dur": 0.412, "args": { "External id": 13134,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120452.639, "dur": 0.414, "args": { "External id": 13135,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650120470.852, "dur": 43.898, "args": { "External id": 13136,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6631 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650120547.366, "dur": 108.698, "args": { "External id": 13137,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650120557.298, "dur": 4.178, "args": { "External id": 13138,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650120566.160, "dur": 10.686, "args": { "External id": 13139,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650120571.103, "dur": 5.361, "args": { "External id": 13140,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120574.607, "dur": 0.656, "args": { "External id": 13141,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650120583.649, "dur": 31.461, "args": { "External id": 13142,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120586.267, "dur": 2.652, "args": { "External id": 13143,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120590.762, "dur": 0.437, "args": { "External id": 13144,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120592.319, "dur": 0.188, "args": { "External id": 13145,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120596.485, "dur": 1.259, "args": { "External id": 13146,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120599.156, "dur": 0.181, "args": { "External id": 13147,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120600.969, "dur": 0.275, "args": { "External id": 13148,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120604.810, "dur": 0.379, "args": { "External id": 13149,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120606.903, "dur": 0.166, "args": { "External id": 13150,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650120608.081, "dur": 2.777, "args": { "External id": 13151,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650120625.733, "dur": 22.015, "args": { "External id": 13152,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6647 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650120708.272, "dur": 335.251, "args": { "External id": 13153,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6648 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650120739.835, "dur": 298.484, "args": { "External id": 13154,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6649, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650120752.934, "dur": 279.649, "args": { "External id": 13155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6650 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650121069.817, "dur": 2.792, "args": { "External id": 13156,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6651, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.8)", "pid": 1336754, "tid": 1336754, "ts": 1295650121161.551, "dur": 17733.567, "args": { "External id": 13157,"Record function id": 0, "Ev Idx": 6652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121282.804, "dur": 6.950, "args": { "External id": 13158,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121293.688, "dur": 1.338, "args": { "External id": 13159,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121296.725, "dur": 2.670, "args": { "External id": 13160,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121301.279, "dur": 0.883, "args": { "External id": 13161,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121303.551, "dur": 1.073, "args": { "External id": 13162,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121305.835, "dur": 0.902, "args": { "External id": 13163,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121310.451, "dur": 0.953, "args": { "External id": 13164,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121313.477, "dur": 2.006, "args": { "External id": 13165,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121316.944, "dur": 0.903, "args": { "External id": 13166,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650121319.371, "dur": 0.908, "args": { "External id": 13167,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6662 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650121352.622, "dur": 17504.870, "args": { "External id": 13168,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650121369.360, "dur": 17481.293, "args": { "External id": 13169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650121389.736, "dur": 16.175, "args": { "External id": 13170,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650121408.953, "dur": 17407.238, "args": { "External id": 13171,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650121411.775, "dur": 17403.913, "args": { "External id": 13172,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650121418.229, "dur": 5.485, "args": { "External id": 13173,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650121425.350, "dur": 17387.230, "args": { "External id": 13174,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6669 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650139054.586, "dur": 37.302, "args": { "External id": 13175,"Sequence number": 246557, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6670 } }, { "ph": "s", "id": 211, "pid": 1336754, "tid": 1336754, "ts": 1295650139054.586, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650139078.978, "dur": 7.737, "args": { "External id": 13176,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650139081.998, "dur": 4.422, "args": { "External id": 13177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6672 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650139157.059, "dur": 91.662, "args": { "External id": 13178,"Record function id": 0, "Ev Idx": 6673 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650139251.854, "dur": 1108.323, "args": { "External id": 13179,"Record function id": 0, "Ev Idx": 6674 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650139295.182, "dur": 1051.416, "args": { "External id": 13180,"Sequence number": 246558, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6675 } }, { "ph": "s", "id": 210, "pid": 1336754, "tid": 1336754, "ts": 1295650139295.182, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650139362.745, "dur": 44.121, "args": { "External id": 13181,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650139420.035, "dur": 105.293, "args": { "External id": 13182,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650139535.496, "dur": 39.080, "args": { "External id": 13183,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650139583.419, "dur": 30.894, "args": { "External id": 13184,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6679 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650139641.236, "dur": 25.245, "args": { "External id": 13185,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6680 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650139685.224, "dur": 17.954, "args": { "External id": 13186,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6681 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650139722.244, "dur": 130.674, "args": { "External id": 13187,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650139772.717, "dur": 11.676, "args": { "External id": 13188,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650139778.014, "dur": 5.666, "args": { "External id": 13189,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650139786.898, "dur": 5.988, "args": { "External id": 13190,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650139794.279, "dur": 1.220, "args": { "External id": 13191,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650139798.086, "dur": 4.439, "args": { "External id": 13192,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650139863.074, "dur": 46.327, "args": { "External id": 13193,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6688 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650139941.858, "dur": 26.404, "args": { "External id": 13194,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650139977.278, "dur": 85.619, "args": { "External id": 13195,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650140075.470, "dur": 41.298, "args": { "External id": 13196,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6691 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650140142.363, "dur": 31.371, "args": { "External id": 13197,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650140179.874, "dur": 34.315, "args": { "External id": 13198,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6693 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650140248.762, "dur": 21.567, "args": { "External id": 13199,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6694 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.8)", "pid": 1336754, "tid": 1336754, "ts": 1295650140425.963, "dur": 80.916, "args": { "External id": 13200,"Record function id": 0, "Ev Idx": 6695 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650140579.725, "dur": 46.899, "args": { "External id": 13201,"Record function id": 0, "Ev Idx": 6696 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.9)", "pid": 1336754, "tid": 1336754, "ts": 1295650140635.384, "dur": 18656.866, "args": { "External id": 13202,"Record function id": 0, "Ev Idx": 6697 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.9)", "pid": 1336754, "tid": 1336754, "ts": 1295650140646.044, "dur": 949.864, "args": { "External id": 13203,"Record function id": 0, "Ev Idx": 6698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650140727.296, "dur": 8.758, "args": { "External id": 13204,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650140749.604, "dur": 35.661, "args": { "External id": 13205,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140754.799, "dur": 2.368, "args": { "External id": 13206,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140761.862, "dur": 0.466, "args": { "External id": 13207,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140763.907, "dur": 0.463, "args": { "External id": 13208,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140765.405, "dur": 0.432, "args": { "External id": 13209,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140770.006, "dur": 0.452, "args": { "External id": 13210,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140771.464, "dur": 0.532, "args": { "External id": 13211,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140773.901, "dur": 2.346, "args": { "External id": 13212,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140777.087, "dur": 0.609, "args": { "External id": 13213,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140779.340, "dur": 0.300, "args": { "External id": 13214,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650140796.094, "dur": 38.467, "args": { "External id": 13215,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6710 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650140867.813, "dur": 161.623, "args": { "External id": 13216,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650140878.561, "dur": 4.015, "args": { "External id": 13217,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650140887.398, "dur": 10.467, "args": { "External id": 13218,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650140892.085, "dur": 5.400, "args": { "External id": 13219,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140895.534, "dur": 0.642, "args": { "External id": 13220,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650140904.323, "dur": 34.814, "args": { "External id": 13221,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140906.254, "dur": 2.566, "args": { "External id": 13222,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140914.863, "dur": 0.583, "args": { "External id": 13223,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140917.631, "dur": 0.450, "args": { "External id": 13224,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140921.387, "dur": 1.668, "args": { "External id": 13225,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140924.441, "dur": 0.383, "args": { "External id": 13226,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140926.264, "dur": 2.396, "args": { "External id": 13227,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140930.332, "dur": 0.185, "args": { "External id": 13228,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140931.315, "dur": 0.321, "args": { "External id": 13229,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650140935.137, "dur": 0.353, "args": { "External id": 13230,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650140959.506, "dur": 59.723, "args": { "External id": 13231,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6726 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650141087.171, "dur": 409.585, "args": { "External id": 13232,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6727 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650141118.457, "dur": 372.887, "args": { "External id": 13233,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6728, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650141131.587, "dur": 353.862, "args": { "External id": 13234,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6729 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650141523.208, "dur": 2.250, "args": { "External id": 13235,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6730, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.9)", "pid": 1336754, "tid": 1336754, "ts": 1295650141618.528, "dur": 17454.596, "args": { "External id": 13236,"Record function id": 0, "Ev Idx": 6731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141725.859, "dur": 7.060, "args": { "External id": 13237,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141736.518, "dur": 1.115, "args": { "External id": 13238,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141739.630, "dur": 2.394, "args": { "External id": 13239,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141743.954, "dur": 0.735, "args": { "External id": 13240,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141746.112, "dur": 0.877, "args": { "External id": 13241,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141748.606, "dur": 0.905, "args": { "External id": 13242,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141753.031, "dur": 0.861, "args": { "External id": 13243,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141755.549, "dur": 2.262, "args": { "External id": 13244,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141759.202, "dur": 0.848, "args": { "External id": 13245,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650141761.802, "dur": 0.762, "args": { "External id": 13246,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6741 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650141784.272, "dur": 17248.587, "args": { "External id": 13247,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650141801.175, "dur": 17224.181, "args": { "External id": 13248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650141821.675, "dur": 14.778, "args": { "External id": 13249,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650141839.533, "dur": 17129.843, "args": { "External id": 13250,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650141842.137, "dur": 17126.546, "args": { "External id": 13251,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650141848.230, "dur": 5.635, "args": { "External id": 13252,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650141855.546, "dur": 17109.902, "args": { "External id": 13253,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6748 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650159215.458, "dur": 50.278, "args": { "External id": 13254,"Sequence number": 246559, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6749 } }, { "ph": "s", "id": 209, "pid": 1336754, "tid": 1336754, "ts": 1295650159215.458, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650159251.014, "dur": 8.914, "args": { "External id": 13255,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650159254.581, "dur": 4.961, "args": { "External id": 13256,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6751 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650159332.377, "dur": 75.400, "args": { "External id": 13257,"Record function id": 0, "Ev Idx": 6752 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650159409.745, "dur": 1112.121, "args": { "External id": 13258,"Record function id": 0, "Ev Idx": 6753 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650159451.316, "dur": 1057.508, "args": { "External id": 13259,"Sequence number": 246560, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6754 } }, { "ph": "s", "id": 208, "pid": 1336754, "tid": 1336754, "ts": 1295650159451.316, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650159518.940, "dur": 45.509, "args": { "External id": 13260,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650159576.757, "dur": 107.253, "args": { "External id": 13261,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650159694.502, "dur": 40.030, "args": { "External id": 13262,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650159743.047, "dur": 31.003, "args": { "External id": 13263,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6758 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650159799.359, "dur": 26.641, "args": { "External id": 13264,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6759 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650159843.871, "dur": 15.553, "args": { "External id": 13265,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6760 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650159877.039, "dur": 168.059, "args": { "External id": 13266,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650159923.708, "dur": 11.232, "args": { "External id": 13267,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650159928.230, "dur": 5.940, "args": { "External id": 13268,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650159937.552, "dur": 6.502, "args": { "External id": 13269,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650159945.527, "dur": 1.423, "args": { "External id": 13270,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650159949.115, "dur": 3.906, "args": { "External id": 13271,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650160058.112, "dur": 57.009, "args": { "External id": 13272,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6767 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650160147.954, "dur": 29.773, "args": { "External id": 13273,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650160194.231, "dur": 57.611, "args": { "External id": 13274,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650160263.919, "dur": 39.352, "args": { "External id": 13275,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6770 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650160329.759, "dur": 29.366, "args": { "External id": 13276,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650160364.730, "dur": 35.045, "args": { "External id": 13277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6772 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650160419.939, "dur": 22.514, "args": { "External id": 13278,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6773 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.9)", "pid": 1336754, "tid": 1336754, "ts": 1295650160584.425, "dur": 74.073, "args": { "External id": 13279,"Record function id": 0, "Ev Idx": 6774 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650160729.783, "dur": 45.339, "args": { "External id": 13280,"Record function id": 0, "Ev Idx": 6775 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.10)", "pid": 1336754, "tid": 1336754, "ts": 1295650160784.210, "dur": 18517.390, "args": { "External id": 13281,"Record function id": 0, "Ev Idx": 6776 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.10)", "pid": 1336754, "tid": 1336754, "ts": 1295650160793.106, "dur": 937.380, "args": { "External id": 13282,"Record function id": 0, "Ev Idx": 6777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650160871.849, "dur": 7.705, "args": { "External id": 13283,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650160893.076, "dur": 38.079, "args": { "External id": 13284,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160898.486, "dur": 2.117, "args": { "External id": 13285,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160905.343, "dur": 0.588, "args": { "External id": 13286,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160907.940, "dur": 0.515, "args": { "External id": 13287,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160909.890, "dur": 0.643, "args": { "External id": 13288,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160914.001, "dur": 0.393, "args": { "External id": 13289,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160915.655, "dur": 0.392, "args": { "External id": 13290,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160917.914, "dur": 3.736, "args": { "External id": 13291,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160922.861, "dur": 0.714, "args": { "External id": 13292,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650160924.803, "dur": 0.497, "args": { "External id": 13293,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650160941.891, "dur": 37.831, "args": { "External id": 13294,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6789 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650161055.328, "dur": 113.163, "args": { "External id": 13295,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650161066.784, "dur": 6.385, "args": { "External id": 13296,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650161078.462, "dur": 10.878, "args": { "External id": 13297,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650161082.813, "dur": 6.125, "args": { "External id": 13298,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161086.482, "dur": 0.784, "args": { "External id": 13299,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650161096.531, "dur": 29.195, "args": { "External id": 13300,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161098.811, "dur": 2.761, "args": { "External id": 13301,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161103.027, "dur": 0.468, "args": { "External id": 13302,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161104.956, "dur": 0.450, "args": { "External id": 13303,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161108.670, "dur": 1.728, "args": { "External id": 13304,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161112.193, "dur": 0.324, "args": { "External id": 13305,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161113.678, "dur": 0.150, "args": { "External id": 13306,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161116.246, "dur": 0.384, "args": { "External id": 13307,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161117.717, "dur": 0.180, "args": { "External id": 13308,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161119.154, "dur": 2.354, "args": { "External id": 13309,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650161136.512, "dur": 24.377, "args": { "External id": 13310,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6805 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650161223.796, "dur": 405.969, "args": { "External id": 13311,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6806 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650161271.066, "dur": 353.780, "args": { "External id": 13312,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6807, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650161313.130, "dur": 306.356, "args": { "External id": 13313,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6808 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650161656.405, "dur": 2.080, "args": { "External id": 13314,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6809, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.10)", "pid": 1336754, "tid": 1336754, "ts": 1295650161752.061, "dur": 17340.931, "args": { "External id": 13315,"Record function id": 0, "Ev Idx": 6810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161854.152, "dur": 6.433, "args": { "External id": 13316,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161864.519, "dur": 0.978, "args": { "External id": 13317,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161867.065, "dur": 2.534, "args": { "External id": 13318,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161871.278, "dur": 0.972, "args": { "External id": 13319,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161873.425, "dur": 0.478, "args": { "External id": 13320,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161875.344, "dur": 0.734, "args": { "External id": 13321,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161879.670, "dur": 0.960, "args": { "External id": 13322,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161882.200, "dur": 1.862, "args": { "External id": 13323,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161885.377, "dur": 0.435, "args": { "External id": 13324,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650161887.415, "dur": 0.410, "args": { "External id": 13325,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6820 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650161907.496, "dur": 17145.062, "args": { "External id": 13326,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650161923.756, "dur": 17121.589, "args": { "External id": 13327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650161942.375, "dur": 15.219, "args": { "External id": 13328,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650161960.535, "dur": 17048.328, "args": { "External id": 13329,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650161963.358, "dur": 17044.894, "args": { "External id": 13330,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650161969.555, "dur": 5.434, "args": { "External id": 13331,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650161976.933, "dur": 17027.952, "args": { "External id": 13332,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6827 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650179225.813, "dur": 48.869, "args": { "External id": 13333,"Sequence number": 246561, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6828 } }, { "ph": "s", "id": 207, "pid": 1336754, "tid": 1336754, "ts": 1295650179225.813, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650179260.903, "dur": 8.266, "args": { "External id": 13334,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650179264.486, "dur": 4.322, "args": { "External id": 13335,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6830 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650179343.159, "dur": 79.216, "args": { "External id": 13336,"Record function id": 0, "Ev Idx": 6831 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650179423.857, "dur": 1121.139, "args": { "External id": 13337,"Record function id": 0, "Ev Idx": 6832 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650179465.529, "dur": 1065.945, "args": { "External id": 13338,"Sequence number": 246562, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6833 } }, { "ph": "s", "id": 206, "pid": 1336754, "tid": 1336754, "ts": 1295650179465.529, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650179536.571, "dur": 42.754, "args": { "External id": 13339,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650179592.251, "dur": 108.869, "args": { "External id": 13340,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650179711.880, "dur": 41.353, "args": { "External id": 13341,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650179762.967, "dur": 31.771, "args": { "External id": 13342,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6837 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650179819.826, "dur": 26.537, "args": { "External id": 13343,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6838 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650179865.420, "dur": 17.525, "args": { "External id": 13344,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6839 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650179900.524, "dur": 172.405, "args": { "External id": 13345,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650179947.903, "dur": 11.311, "args": { "External id": 13346,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650179952.734, "dur": 5.756, "args": { "External id": 13347,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650179961.736, "dur": 6.669, "args": { "External id": 13348,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650179970.017, "dur": 1.430, "args": { "External id": 13349,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650179973.626, "dur": 4.290, "args": { "External id": 13350,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650180084.993, "dur": 53.280, "args": { "External id": 13351,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6846 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650180173.218, "dur": 31.464, "args": { "External id": 13352,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650180213.975, "dur": 60.210, "args": { "External id": 13353,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650180286.513, "dur": 37.397, "args": { "External id": 13354,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6849 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650180348.061, "dur": 29.512, "args": { "External id": 13355,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650180383.469, "dur": 34.301, "args": { "External id": 13356,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6851 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650180440.074, "dur": 21.052, "args": { "External id": 13357,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6852 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.10)", "pid": 1336754, "tid": 1336754, "ts": 1295650180607.437, "dur": 72.822, "args": { "External id": 13358,"Record function id": 0, "Ev Idx": 6853 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650180753.545, "dur": 45.478, "args": { "External id": 13359,"Record function id": 0, "Ev Idx": 6854 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.11)", "pid": 1336754, "tid": 1336754, "ts": 1295650180807.222, "dur": 18368.568, "args": { "External id": 13360,"Record function id": 0, "Ev Idx": 6855 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.11)", "pid": 1336754, "tid": 1336754, "ts": 1295650180816.910, "dur": 910.707, "args": { "External id": 13361,"Record function id": 0, "Ev Idx": 6856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650180893.581, "dur": 8.259, "args": { "External id": 13362,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650180915.868, "dur": 38.650, "args": { "External id": 13363,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180921.592, "dur": 2.355, "args": { "External id": 13364,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180928.712, "dur": 0.282, "args": { "External id": 13365,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180930.515, "dur": 0.289, "args": { "External id": 13366,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180932.254, "dur": 0.544, "args": { "External id": 13367,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180937.514, "dur": 0.467, "args": { "External id": 13368,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180939.600, "dur": 0.418, "args": { "External id": 13369,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180941.453, "dur": 3.816, "args": { "External id": 13370,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180946.595, "dur": 0.400, "args": { "External id": 13371,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650180948.627, "dur": 0.371, "args": { "External id": 13372,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650180968.923, "dur": 79.386, "args": { "External id": 13373,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6868 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650181085.233, "dur": 113.786, "args": { "External id": 13374,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650181096.698, "dur": 7.553, "args": { "External id": 13375,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650181109.391, "dur": 11.048, "args": { "External id": 13376,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650181114.352, "dur": 5.678, "args": { "External id": 13377,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181117.888, "dur": 0.646, "args": { "External id": 13378,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650181127.417, "dur": 28.672, "args": { "External id": 13379,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181129.597, "dur": 0.528, "args": { "External id": 13380,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181131.734, "dur": 2.455, "args": { "External id": 13381,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181135.496, "dur": 0.547, "args": { "External id": 13382,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181137.674, "dur": 1.636, "args": { "External id": 13383,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181143.292, "dur": 0.199, "args": { "External id": 13384,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181144.612, "dur": 0.438, "args": { "External id": 13385,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181146.349, "dur": 0.387, "args": { "External id": 13386,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181150.242, "dur": 0.195, "args": { "External id": 13387,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181151.733, "dur": 0.442, "args": { "External id": 13388,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650181169.007, "dur": 22.718, "args": { "External id": 13389,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6884 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650181275.916, "dur": 356.250, "args": { "External id": 13390,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6885 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650181308.566, "dur": 318.462, "args": { "External id": 13391,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6886, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650181322.112, "dur": 299.413, "args": { "External id": 13392,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6887 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650181657.372, "dur": 3.663, "args": { "External id": 13393,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6888, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.11)", "pid": 1336754, "tid": 1336754, "ts": 1295650181748.109, "dur": 17207.655, "args": { "External id": 13394,"Record function id": 0, "Ev Idx": 6889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181845.207, "dur": 6.429, "args": { "External id": 13395,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181854.741, "dur": 0.998, "args": { "External id": 13396,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181857.564, "dur": 1.808, "args": { "External id": 13397,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181861.089, "dur": 0.798, "args": { "External id": 13398,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181863.493, "dur": 0.796, "args": { "External id": 13399,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181865.856, "dur": 0.499, "args": { "External id": 13400,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181870.160, "dur": 0.713, "args": { "External id": 13401,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181872.561, "dur": 1.568, "args": { "External id": 13402,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181875.629, "dur": 0.695, "args": { "External id": 13403,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650181878.042, "dur": 1.049, "args": { "External id": 13404,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6899 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650181899.004, "dur": 17018.643, "args": { "External id": 13405,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650181914.592, "dur": 16996.278, "args": { "External id": 13406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650181934.636, "dur": 15.486, "args": { "External id": 13407,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650181953.122, "dur": 16923.339, "args": { "External id": 13408,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650181955.645, "dur": 16920.295, "args": { "External id": 13409,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650181962.069, "dur": 5.600, "args": { "External id": 13410,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650181969.920, "dur": 16902.979, "args": { "External id": 13411,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6906 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650199110.990, "dur": 38.845, "args": { "External id": 13412,"Sequence number": 246563, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6907 } }, { "ph": "s", "id": 205, "pid": 1336754, "tid": 1336754, "ts": 1295650199110.990, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650199136.876, "dur": 7.816, "args": { "External id": 13413,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650199139.991, "dur": 4.334, "args": { "External id": 13414,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6909 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650199217.220, "dur": 89.411, "args": { "External id": 13415,"Record function id": 0, "Ev Idx": 6910 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650199309.612, "dur": 1115.301, "args": { "External id": 13416,"Record function id": 0, "Ev Idx": 6911 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650199351.767, "dur": 1060.143, "args": { "External id": 13417,"Sequence number": 246564, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6912 } }, { "ph": "s", "id": 204, "pid": 1336754, "tid": 1336754, "ts": 1295650199351.767, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650199419.415, "dur": 44.731, "args": { "External id": 13418,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650199477.571, "dur": 104.666, "args": { "External id": 13419,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650199592.790, "dur": 39.897, "args": { "External id": 13420,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650199641.984, "dur": 30.711, "args": { "External id": 13421,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6916 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650199697.506, "dur": 28.420, "args": { "External id": 13422,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6917 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650199744.338, "dur": 14.853, "args": { "External id": 13423,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6918 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650199777.110, "dur": 130.381, "args": { "External id": 13424,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650199827.223, "dur": 11.346, "args": { "External id": 13425,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650199832.312, "dur": 5.555, "args": { "External id": 13426,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650199841.278, "dur": 6.187, "args": { "External id": 13427,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650199848.874, "dur": 1.756, "args": { "External id": 13428,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650199852.715, "dur": 4.630, "args": { "External id": 13429,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650199918.430, "dur": 49.817, "args": { "External id": 13430,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6925 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650200045.114, "dur": 32.508, "args": { "External id": 13431,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650200089.292, "dur": 46.500, "args": { "External id": 13432,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650200144.930, "dur": 35.408, "args": { "External id": 13433,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 6928 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650200205.189, "dur": 42.378, "args": { "External id": 13434,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 6929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650200255.667, "dur": 41.019, "args": { "External id": 13435,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 6930 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650200318.713, "dur": 22.606, "args": { "External id": 13436,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 6931 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.11)", "pid": 1336754, "tid": 1336754, "ts": 1295650200489.103, "dur": 72.970, "args": { "External id": 13437,"Record function id": 0, "Ev Idx": 6932 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650200633.902, "dur": 46.436, "args": { "External id": 13438,"Record function id": 0, "Ev Idx": 6933 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.12)", "pid": 1336754, "tid": 1336754, "ts": 1295650200689.670, "dur": 18498.275, "args": { "External id": 13439,"Record function id": 0, "Ev Idx": 6934 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.12)", "pid": 1336754, "tid": 1336754, "ts": 1295650200697.391, "dur": 905.120, "args": { "External id": 13440,"Record function id": 0, "Ev Idx": 6935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650200779.056, "dur": 8.385, "args": { "External id": 13441,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650200804.123, "dur": 38.210, "args": { "External id": 13442,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200810.333, "dur": 2.399, "args": { "External id": 13443,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200816.839, "dur": 0.518, "args": { "External id": 13444,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200819.346, "dur": 0.461, "args": { "External id": 13445,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200821.071, "dur": 2.277, "args": { "External id": 13446,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200824.727, "dur": 0.268, "args": { "External id": 13447,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200825.949, "dur": 0.641, "args": { "External id": 13448,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200830.830, "dur": 1.740, "args": { "External id": 13449,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200833.823, "dur": 0.380, "args": { "External id": 13450,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200836.293, "dur": 0.380, "args": { "External id": 13451,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650200853.274, "dur": 37.841, "args": { "External id": 13452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6947 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650200923.512, "dur": 153.437, "args": { "External id": 13453,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 6948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650200933.344, "dur": 4.307, "args": { "External id": 13454,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650200942.866, "dur": 11.830, "args": { "External id": 13455,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650200947.291, "dur": 6.972, "args": { "External id": 13456,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 6951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200950.568, "dur": 2.512, "args": { "External id": 13457,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 6952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650200961.367, "dur": 68.724, "args": { "External id": 13458,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 6953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200963.493, "dur": 0.483, "args": { "External id": 13459,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200965.250, "dur": 0.298, "args": { "External id": 13460,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200967.928, "dur": 0.355, "args": { "External id": 13461,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200971.456, "dur": 1.969, "args": { "External id": 13462,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200974.516, "dur": 0.380, "args": { "External id": 13463,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200976.022, "dur": 2.480, "args": { "External id": 13464,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650200980.033, "dur": 0.369, "args": { "External id": 13465,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650201019.872, "dur": 0.509, "args": { "External id": 13466,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650201025.302, "dur": 0.432, "args": { "External id": 13467,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 6962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650201042.630, "dur": 26.081, "args": { "External id": 13468,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 6963 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650201134.516, "dur": 373.490, "args": { "External id": 13469,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 6964 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650201168.689, "dur": 334.591, "args": { "External id": 13470,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 6965, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650201179.228, "dur": 318.167, "args": { "External id": 13471,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 6966 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650201534.637, "dur": 2.253, "args": { "External id": 13472,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 6967, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.12)", "pid": 1336754, "tid": 1336754, "ts": 1295650201622.742, "dur": 17341.784, "args": { "External id": 13473,"Record function id": 0, "Ev Idx": 6968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201721.153, "dur": 6.186, "args": { "External id": 13474,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 6969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201730.883, "dur": 1.524, "args": { "External id": 13475,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201734.147, "dur": 2.658, "args": { "External id": 13476,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201738.510, "dur": 0.729, "args": { "External id": 13477,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201740.662, "dur": 0.531, "args": { "External id": 13478,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201742.660, "dur": 0.671, "args": { "External id": 13479,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 6974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201747.509, "dur": 0.735, "args": { "External id": 13480,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 6975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201749.896, "dur": 1.824, "args": { "External id": 13481,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201753.324, "dur": 0.685, "args": { "External id": 13482,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650201755.448, "dur": 0.448, "args": { "External id": 13483,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 6978 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650201776.083, "dur": 17148.834, "args": { "External id": 13484,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650201792.189, "dur": 17125.498, "args": { "External id": 13485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 6980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650201811.755, "dur": 15.380, "args": { "External id": 13486,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650201830.586, "dur": 17052.192, "args": { "External id": 13487,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 6982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650201832.795, "dur": 17049.346, "args": { "External id": 13488,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 6983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650201838.546, "dur": 5.738, "args": { "External id": 13489,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 6984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650201845.901, "dur": 17032.924, "args": { "External id": 13490,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 6985 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650219123.863, "dur": 39.129, "args": { "External id": 13491,"Sequence number": 246565, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 6986 } }, { "ph": "s", "id": 203, "pid": 1336754, "tid": 1336754, "ts": 1295650219123.863, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650219150.094, "dur": 7.580, "args": { "External id": 13492,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 6987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650219152.948, "dur": 4.402, "args": { "External id": 13493,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 6988 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650219226.487, "dur": 89.498, "args": { "External id": 13494,"Record function id": 0, "Ev Idx": 6989 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650219318.808, "dur": 1107.781, "args": { "External id": 13495,"Record function id": 0, "Ev Idx": 6990 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650219362.419, "dur": 1051.025, "args": { "External id": 13496,"Sequence number": 246566, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 6991 } }, { "ph": "s", "id": 202, "pid": 1336754, "tid": 1336754, "ts": 1295650219362.419, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650219433.034, "dur": 44.773, "args": { "External id": 13497,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 6992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650219490.590, "dur": 104.647, "args": { "External id": 13498,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650219604.878, "dur": 38.795, "args": { "External id": 13499,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650219652.364, "dur": 32.808, "args": { "External id": 13500,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 6995 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650219709.976, "dur": 25.306, "args": { "External id": 13501,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6996 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650219755.138, "dur": 16.278, "args": { "External id": 13502,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 6997 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650219789.989, "dur": 129.854, "args": { "External id": 13503,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 6998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650219840.179, "dur": 11.367, "args": { "External id": 13504,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 6999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650219845.283, "dur": 5.525, "args": { "External id": 13505,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650219854.213, "dur": 6.341, "args": { "External id": 13506,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650219861.912, "dur": 1.258, "args": { "External id": 13507,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650219865.681, "dur": 3.647, "args": { "External id": 13508,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650219929.650, "dur": 45.856, "args": { "External id": 13509,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7004 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650220046.721, "dur": 32.055, "args": { "External id": 13510,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650220088.815, "dur": 46.850, "args": { "External id": 13511,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650220144.922, "dur": 35.148, "args": { "External id": 13512,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7007 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650220212.763, "dur": 44.887, "args": { "External id": 13513,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650220268.355, "dur": 39.469, "args": { "External id": 13514,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7009 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650220328.358, "dur": 19.434, "args": { "External id": 13515,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7010 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.12)", "pid": 1336754, "tid": 1336754, "ts": 1295650220488.632, "dur": 74.302, "args": { "External id": 13516,"Record function id": 0, "Ev Idx": 7011 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650220634.791, "dur": 45.340, "args": { "External id": 13517,"Record function id": 0, "Ev Idx": 7012 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.13)", "pid": 1336754, "tid": 1336754, "ts": 1295650220689.257, "dur": 18332.915, "args": { "External id": 13518,"Record function id": 0, "Ev Idx": 7013 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.13)", "pid": 1336754, "tid": 1336754, "ts": 1295650220697.784, "dur": 899.404, "args": { "External id": 13519,"Record function id": 0, "Ev Idx": 7014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650220777.150, "dur": 8.452, "args": { "External id": 13520,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650220799.674, "dur": 35.522, "args": { "External id": 13521,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220804.960, "dur": 2.268, "args": { "External id": 13522,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220811.893, "dur": 0.539, "args": { "External id": 13523,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220813.748, "dur": 0.305, "args": { "External id": 13524,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220815.589, "dur": 0.192, "args": { "External id": 13525,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220818.813, "dur": 0.183, "args": { "External id": 13526,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220820.644, "dur": 0.198, "args": { "External id": 13527,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220822.286, "dur": 3.802, "args": { "External id": 13528,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220827.897, "dur": 0.196, "args": { "External id": 13529,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220829.266, "dur": 0.226, "args": { "External id": 13530,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650220846.105, "dur": 38.225, "args": { "External id": 13531,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7026 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650220917.654, "dur": 154.404, "args": { "External id": 13532,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650220927.721, "dur": 3.620, "args": { "External id": 13533,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650220936.147, "dur": 10.395, "args": { "External id": 13534,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650220940.482, "dur": 5.691, "args": { "External id": 13535,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220944.286, "dur": 0.579, "args": { "External id": 13536,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650220953.523, "dur": 66.884, "args": { "External id": 13537,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220954.961, "dur": 2.715, "args": { "External id": 13538,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220959.830, "dur": 0.567, "args": { "External id": 13539,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220961.440, "dur": 0.206, "args": { "External id": 13540,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220965.163, "dur": 1.360, "args": { "External id": 13541,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220967.670, "dur": 0.219, "args": { "External id": 13542,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220969.761, "dur": 0.384, "args": { "External id": 13543,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220972.814, "dur": 0.478, "args": { "External id": 13544,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220974.987, "dur": 0.268, "args": { "External id": 13545,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650220976.394, "dur": 2.146, "args": { "External id": 13546,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650221036.362, "dur": 27.392, "args": { "External id": 13547,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7042 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650221130.059, "dur": 371.116, "args": { "External id": 13548,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7043 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650221163.626, "dur": 332.389, "args": { "External id": 13549,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7044, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650221174.371, "dur": 313.519, "args": { "External id": 13550,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7045 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650221527.906, "dur": 2.474, "args": { "External id": 13551,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7046, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.13)", "pid": 1336754, "tid": 1336754, "ts": 1295650221618.470, "dur": 17183.357, "args": { "External id": 13552,"Record function id": 0, "Ev Idx": 7047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221720.867, "dur": 6.888, "args": { "External id": 13553,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221731.263, "dur": 0.894, "args": { "External id": 13554,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221733.980, "dur": 2.696, "args": { "External id": 13555,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221738.295, "dur": 0.705, "args": { "External id": 13556,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221740.320, "dur": 0.992, "args": { "External id": 13557,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221744.895, "dur": 1.253, "args": { "External id": 13558,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221748.117, "dur": 0.870, "args": { "External id": 13559,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221750.375, "dur": 1.743, "args": { "External id": 13560,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221753.655, "dur": 1.165, "args": { "External id": 13561,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650221758.512, "dur": 0.995, "args": { "External id": 13562,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7057 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650221776.468, "dur": 16986.049, "args": { "External id": 13563,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650221792.570, "dur": 16963.053, "args": { "External id": 13564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650221813.718, "dur": 14.458, "args": { "External id": 13565,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650221831.272, "dur": 16890.512, "args": { "External id": 13566,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650221833.857, "dur": 16887.347, "args": { "External id": 13567,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650221840.022, "dur": 5.690, "args": { "External id": 13568,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650221847.362, "dur": 16870.752, "args": { "External id": 13569,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7064 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650238932.522, "dur": 35.685, "args": { "External id": 13570,"Sequence number": 246567, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7065 } }, { "ph": "s", "id": 201, "pid": 1336754, "tid": 1336754, "ts": 1295650238932.522, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650238955.885, "dur": 7.495, "args": { "External id": 13571,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650238958.866, "dur": 4.264, "args": { "External id": 13572,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7067 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650239065.023, "dur": 75.566, "args": { "External id": 13573,"Record function id": 0, "Ev Idx": 7068 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650239142.300, "dur": 1108.028, "args": { "External id": 13574,"Record function id": 0, "Ev Idx": 7069 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650239180.495, "dur": 1041.615, "args": { "External id": 13575,"Sequence number": 246568, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7070 } }, { "ph": "s", "id": 200, "pid": 1336754, "tid": 1336754, "ts": 1295650239180.495, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650239262.185, "dur": 46.360, "args": { "External id": 13576,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239322.777, "dur": 104.474, "args": { "External id": 13577,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239437.107, "dur": 39.555, "args": { "External id": 13578,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239485.490, "dur": 31.767, "args": { "External id": 13579,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7074 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650239543.976, "dur": 27.406, "args": { "External id": 13580,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7075 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650239589.312, "dur": 15.494, "args": { "External id": 13581,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7076 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650239623.160, "dur": 131.408, "args": { "External id": 13582,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650239673.998, "dur": 11.992, "args": { "External id": 13583,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650239679.081, "dur": 6.037, "args": { "External id": 13584,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650239688.824, "dur": 6.337, "args": { "External id": 13585,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650239696.616, "dur": 1.366, "args": { "External id": 13586,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650239700.493, "dur": 4.497, "args": { "External id": 13587,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239764.933, "dur": 50.215, "args": { "External id": 13588,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7083 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650239846.912, "dur": 27.621, "args": { "External id": 13589,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239883.913, "dur": 42.061, "args": { "External id": 13590,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650239934.967, "dur": 36.031, "args": { "External id": 13591,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7086 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650240034.329, "dur": 28.446, "args": { "External id": 13592,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650240069.755, "dur": 40.715, "args": { "External id": 13593,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7088 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650240132.288, "dur": 18.915, "args": { "External id": 13594,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7089 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.13)", "pid": 1336754, "tid": 1336754, "ts": 1295650240316.753, "dur": 78.548, "args": { "External id": 13595,"Record function id": 0, "Ev Idx": 7090 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650240469.145, "dur": 49.621, "args": { "External id": 13596,"Record function id": 0, "Ev Idx": 7091 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.14)", "pid": 1336754, "tid": 1336754, "ts": 1295650240527.585, "dur": 18265.328, "args": { "External id": 13597,"Record function id": 0, "Ev Idx": 7092 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.14)", "pid": 1336754, "tid": 1336754, "ts": 1295650240535.939, "dur": 941.543, "args": { "External id": 13598,"Record function id": 0, "Ev Idx": 7093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650240617.581, "dur": 8.606, "args": { "External id": 13599,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650240640.295, "dur": 44.669, "args": { "External id": 13600,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240651.189, "dur": 2.453, "args": { "External id": 13601,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240658.356, "dur": 0.663, "args": { "External id": 13602,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240660.402, "dur": 0.593, "args": { "External id": 13603,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240662.229, "dur": 2.579, "args": { "External id": 13604,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240665.699, "dur": 0.171, "args": { "External id": 13605,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240669.237, "dur": 0.409, "args": { "External id": 13606,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240672.416, "dur": 2.080, "args": { "External id": 13607,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240676.063, "dur": 0.167, "args": { "External id": 13608,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240677.187, "dur": 2.238, "args": { "External id": 13609,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650240695.557, "dur": 41.109, "args": { "External id": 13610,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7105 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650240768.317, "dur": 106.053, "args": { "External id": 13611,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650240778.799, "dur": 3.769, "args": { "External id": 13612,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650240788.141, "dur": 9.849, "args": { "External id": 13613,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650240792.356, "dur": 5.231, "args": { "External id": 13614,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240795.798, "dur": 0.647, "args": { "External id": 13615,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650240804.551, "dur": 28.999, "args": { "External id": 13616,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240806.363, "dur": 0.460, "args": { "External id": 13617,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240808.973, "dur": 0.412, "args": { "External id": 13618,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240810.494, "dur": 2.963, "args": { "External id": 13619,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240814.777, "dur": 1.986, "args": { "External id": 13620,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240817.987, "dur": 0.200, "args": { "External id": 13621,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240822.321, "dur": 0.396, "args": { "External id": 13622,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240824.143, "dur": 0.361, "args": { "External id": 13623,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240825.934, "dur": 0.202, "args": { "External id": 13624,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650240829.310, "dur": 0.406, "args": { "External id": 13625,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650240844.752, "dur": 22.003, "args": { "External id": 13626,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7121 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650240926.039, "dur": 447.513, "args": { "External id": 13627,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7122 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650240959.578, "dur": 407.851, "args": { "External id": 13628,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7123, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650240969.457, "dur": 391.429, "args": { "External id": 13629,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7124 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650241401.904, "dur": 2.637, "args": { "External id": 13630,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7125, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.14)", "pid": 1336754, "tid": 1336754, "ts": 1295650241499.458, "dur": 17096.741, "args": { "External id": 13631,"Record function id": 0, "Ev Idx": 7126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241601.672, "dur": 6.817, "args": { "External id": 13632,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241611.986, "dur": 1.391, "args": { "External id": 13633,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241615.224, "dur": 3.542, "args": { "External id": 13634,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241620.655, "dur": 0.910, "args": { "External id": 13635,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241622.829, "dur": 1.112, "args": { "External id": 13636,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241625.277, "dur": 0.697, "args": { "External id": 13637,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241629.891, "dur": 1.094, "args": { "External id": 13638,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241632.737, "dur": 2.120, "args": { "External id": 13639,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241636.062, "dur": 0.915, "args": { "External id": 13640,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650241638.651, "dur": 0.993, "args": { "External id": 13641,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7136 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650241659.015, "dur": 16898.457, "args": { "External id": 13642,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650241674.813, "dur": 16875.740, "args": { "External id": 13643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650241696.027, "dur": 14.826, "args": { "External id": 13644,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650241713.862, "dur": 16801.930, "args": { "External id": 13645,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650241716.419, "dur": 16798.805, "args": { "External id": 13646,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650241722.754, "dur": 5.251, "args": { "External id": 13647,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650241729.912, "dur": 16781.954, "args": { "External id": 13648,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7143 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650258730.469, "dur": 36.662, "args": { "External id": 13649,"Sequence number": 246569, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7144 } }, { "ph": "s", "id": 199, "pid": 1336754, "tid": 1336754, "ts": 1295650258730.469, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650258753.796, "dur": 8.193, "args": { "External id": 13650,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650258757.493, "dur": 4.295, "args": { "External id": 13651,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7146 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650258831.624, "dur": 77.792, "args": { "External id": 13652,"Record function id": 0, "Ev Idx": 7147 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650258911.142, "dur": 1148.706, "args": { "External id": 13653,"Record function id": 0, "Ev Idx": 7148 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650258950.742, "dur": 1094.434, "args": { "External id": 13654,"Sequence number": 246570, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7149 } }, { "ph": "s", "id": 198, "pid": 1336754, "tid": 1336754, "ts": 1295650258950.742, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650259053.847, "dur": 47.400, "args": { "External id": 13655,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259115.270, "dur": 106.516, "args": { "External id": 13656,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259249.621, "dur": 44.178, "args": { "External id": 13657,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259304.728, "dur": 32.485, "args": { "External id": 13658,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7153 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650259364.580, "dur": 29.451, "args": { "External id": 13659,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7154 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650259412.678, "dur": 16.453, "args": { "External id": 13660,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7155 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650259448.374, "dur": 142.228, "args": { "External id": 13661,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650259507.672, "dur": 12.214, "args": { "External id": 13662,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650259513.046, "dur": 6.091, "args": { "External id": 13663,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650259522.970, "dur": 6.104, "args": { "External id": 13664,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650259530.545, "dur": 1.601, "args": { "External id": 13665,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650259534.583, "dur": 4.912, "args": { "External id": 13666,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259601.415, "dur": 48.164, "args": { "External id": 13667,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7162 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650259683.511, "dur": 29.332, "args": { "External id": 13668,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259722.750, "dur": 43.218, "args": { "External id": 13669,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259774.765, "dur": 35.956, "args": { "External id": 13670,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7165 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650259831.920, "dur": 27.602, "args": { "External id": 13671,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650259865.065, "dur": 34.597, "args": { "External id": 13672,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7167 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650259922.087, "dur": 18.469, "args": { "External id": 13673,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7168 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.14)", "pid": 1336754, "tid": 1336754, "ts": 1295650260125.573, "dur": 76.124, "args": { "External id": 13674,"Record function id": 0, "Ev Idx": 7169 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650260293.616, "dur": 48.263, "args": { "External id": 13675,"Record function id": 0, "Ev Idx": 7170 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.15)", "pid": 1336754, "tid": 1336754, "ts": 1295650260350.998, "dur": 18236.231, "args": { "External id": 13676,"Record function id": 0, "Ev Idx": 7171 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.15)", "pid": 1336754, "tid": 1336754, "ts": 1295650260359.799, "dur": 968.250, "args": { "External id": 13677,"Record function id": 0, "Ev Idx": 7172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650260438.996, "dur": 9.198, "args": { "External id": 13678,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650260462.600, "dur": 38.406, "args": { "External id": 13679,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260468.496, "dur": 2.388, "args": { "External id": 13680,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260475.812, "dur": 0.654, "args": { "External id": 13681,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260478.165, "dur": 0.442, "args": { "External id": 13682,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260480.039, "dur": 0.522, "args": { "External id": 13683,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260484.314, "dur": 0.493, "args": { "External id": 13684,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260485.805, "dur": 0.207, "args": { "External id": 13685,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260487.739, "dur": 4.095, "args": { "External id": 13686,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260492.949, "dur": 0.420, "args": { "External id": 13687,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260494.923, "dur": 0.540, "args": { "External id": 13688,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650260512.884, "dur": 43.564, "args": { "External id": 13689,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7184 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650260589.199, "dur": 118.440, "args": { "External id": 13690,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650260599.797, "dur": 3.867, "args": { "External id": 13691,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650260608.731, "dur": 10.066, "args": { "External id": 13692,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650260613.446, "dur": 4.945, "args": { "External id": 13693,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260616.631, "dur": 0.522, "args": { "External id": 13694,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650260625.587, "dur": 30.035, "args": { "External id": 13695,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260627.607, "dur": 2.670, "args": { "External id": 13696,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260632.267, "dur": 0.408, "args": { "External id": 13697,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260633.750, "dur": 0.658, "args": { "External id": 13698,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260638.197, "dur": 1.342, "args": { "External id": 13699,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260641.106, "dur": 0.382, "args": { "External id": 13700,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260642.496, "dur": 0.194, "args": { "External id": 13701,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260646.365, "dur": 0.327, "args": { "External id": 13702,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260647.878, "dur": 0.378, "args": { "External id": 13703,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650260649.692, "dur": 2.277, "args": { "External id": 13704,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650260677.813, "dur": 21.855, "args": { "External id": 13705,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7200 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650260760.966, "dur": 447.048, "args": { "External id": 13706,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7201 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650260793.846, "dur": 409.012, "args": { "External id": 13707,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7202, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650260805.966, "dur": 390.945, "args": { "External id": 13708,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7203 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650261249.351, "dur": 3.441, "args": { "External id": 13709,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7204, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.15)", "pid": 1336754, "tid": 1336754, "ts": 1295650261350.679, "dur": 17045.176, "args": { "External id": 13710,"Record function id": 0, "Ev Idx": 7205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261455.617, "dur": 6.718, "args": { "External id": 13711,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261466.201, "dur": 1.086, "args": { "External id": 13712,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261469.108, "dur": 2.652, "args": { "External id": 13713,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261473.309, "dur": 0.770, "args": { "External id": 13714,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261475.733, "dur": 0.877, "args": { "External id": 13715,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261477.684, "dur": 0.858, "args": { "External id": 13716,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261482.506, "dur": 0.629, "args": { "External id": 13717,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261484.609, "dur": 1.783, "args": { "External id": 13718,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261487.668, "dur": 0.643, "args": { "External id": 13719,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650261490.139, "dur": 0.672, "args": { "External id": 13720,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7215 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650261510.457, "dur": 16846.041, "args": { "External id": 13721,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650261527.214, "dur": 16822.575, "args": { "External id": 13722,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650261548.185, "dur": 15.465, "args": { "External id": 13723,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650261566.877, "dur": 16749.603, "args": { "External id": 13724,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650261569.536, "dur": 16746.400, "args": { "External id": 13725,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650261575.759, "dur": 5.609, "args": { "External id": 13726,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650261583.201, "dur": 16729.564, "args": { "External id": 13727,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7222 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650278523.741, "dur": 38.424, "args": { "External id": 13728,"Sequence number": 246571, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7223 } }, { "ph": "s", "id": 197, "pid": 1336754, "tid": 1336754, "ts": 1295650278523.741, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650278549.782, "dur": 7.402, "args": { "External id": 13729,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650278552.734, "dur": 4.248, "args": { "External id": 13730,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7225 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650278626.417, "dur": 78.553, "args": { "External id": 13731,"Record function id": 0, "Ev Idx": 7226 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650278706.701, "dur": 1117.390, "args": { "External id": 13732,"Record function id": 0, "Ev Idx": 7227 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650278750.060, "dur": 1061.236, "args": { "External id": 13733,"Sequence number": 246572, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7228 } }, { "ph": "s", "id": 196, "pid": 1336754, "tid": 1336754, "ts": 1295650278750.060, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650278815.854, "dur": 42.247, "args": { "External id": 13734,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650278870.859, "dur": 104.770, "args": { "External id": 13735,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279024.834, "dur": 48.867, "args": { "External id": 13736,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279083.827, "dur": 32.326, "args": { "External id": 13737,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7232 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650279143.110, "dur": 29.638, "args": { "External id": 13738,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7233 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650279191.346, "dur": 15.772, "args": { "External id": 13739,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7234 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650279225.993, "dur": 152.147, "args": { "External id": 13740,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650279294.179, "dur": 12.878, "args": { "External id": 13741,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650279299.619, "dur": 6.616, "args": { "External id": 13742,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650279309.923, "dur": 5.647, "args": { "External id": 13743,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650279317.128, "dur": 1.250, "args": { "External id": 13744,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650279320.971, "dur": 5.065, "args": { "External id": 13745,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279388.670, "dur": 54.284, "args": { "External id": 13746,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7241 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650279476.538, "dur": 29.652, "args": { "External id": 13747,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279515.831, "dur": 43.000, "args": { "External id": 13748,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279567.760, "dur": 35.790, "args": { "External id": 13749,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7244 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650279627.323, "dur": 26.973, "args": { "External id": 13750,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650279659.998, "dur": 35.401, "args": { "External id": 13751,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7246 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650279715.589, "dur": 21.809, "args": { "External id": 13752,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7247 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.15)", "pid": 1336754, "tid": 1336754, "ts": 1295650279888.142, "dur": 73.906, "args": { "External id": 13753,"Record function id": 0, "Ev Idx": 7248 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650280077.503, "dur": 50.592, "args": { "External id": 13754,"Record function id": 0, "Ev Idx": 7249 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.16)", "pid": 1336754, "tid": 1336754, "ts": 1295650280136.915, "dur": 18187.455, "args": { "External id": 13755,"Record function id": 0, "Ev Idx": 7250 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.16)", "pid": 1336754, "tid": 1336754, "ts": 1295650280146.295, "dur": 912.871, "args": { "External id": 13756,"Record function id": 0, "Ev Idx": 7251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650280241.892, "dur": 10.959, "args": { "External id": 13757,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650280269.687, "dur": 38.496, "args": { "External id": 13758,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280275.708, "dur": 2.472, "args": { "External id": 13759,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280283.004, "dur": 0.232, "args": { "External id": 13760,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280285.261, "dur": 0.589, "args": { "External id": 13761,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280286.886, "dur": 0.401, "args": { "External id": 13762,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280290.908, "dur": 0.779, "args": { "External id": 13763,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280292.930, "dur": 0.399, "args": { "External id": 13764,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280294.927, "dur": 4.152, "args": { "External id": 13765,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280300.061, "dur": 0.184, "args": { "External id": 13766,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280301.763, "dur": 0.740, "args": { "External id": 13767,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650280323.690, "dur": 45.159, "args": { "External id": 13768,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7263 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650280403.015, "dur": 107.941, "args": { "External id": 13769,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650280414.402, "dur": 6.323, "args": { "External id": 13770,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650280426.370, "dur": 9.970, "args": { "External id": 13771,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650280431.025, "dur": 4.912, "args": { "External id": 13772,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280434.192, "dur": 0.560, "args": { "External id": 13773,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650280443.586, "dur": 26.530, "args": { "External id": 13774,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280445.410, "dur": 0.552, "args": { "External id": 13775,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280447.365, "dur": 2.436, "args": { "External id": 13776,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280451.189, "dur": 0.213, "args": { "External id": 13777,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280452.437, "dur": 1.313, "args": { "External id": 13778,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280457.318, "dur": 0.373, "args": { "External id": 13779,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280458.822, "dur": 0.622, "args": { "External id": 13780,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280460.462, "dur": 0.159, "args": { "External id": 13781,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280464.144, "dur": 0.370, "args": { "External id": 13782,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650280465.973, "dur": 0.157, "args": { "External id": 13783,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650280481.102, "dur": 21.832, "args": { "External id": 13784,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7279 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650280565.217, "dur": 362.206, "args": { "External id": 13785,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7280 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650280599.929, "dur": 322.801, "args": { "External id": 13786,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7281, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650280610.268, "dur": 307.374, "args": { "External id": 13787,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7282 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650280951.723, "dur": 2.344, "args": { "External id": 13788,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7283, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.16)", "pid": 1336754, "tid": 1336754, "ts": 1295650281082.613, "dur": 17041.247, "args": { "External id": 13789,"Record function id": 0, "Ev Idx": 7284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281182.392, "dur": 6.480, "args": { "External id": 13790,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281192.351, "dur": 1.011, "args": { "External id": 13791,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281194.919, "dur": 2.453, "args": { "External id": 13792,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281199.092, "dur": 0.737, "args": { "External id": 13793,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281201.138, "dur": 0.913, "args": { "External id": 13794,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281203.454, "dur": 0.765, "args": { "External id": 13795,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281207.984, "dur": 1.073, "args": { "External id": 13796,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281210.627, "dur": 1.762, "args": { "External id": 13797,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281213.887, "dur": 0.765, "args": { "External id": 13798,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650281216.237, "dur": 0.855, "args": { "External id": 13799,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7294 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650281252.336, "dur": 16832.710, "args": { "External id": 13800,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650281269.778, "dur": 16808.660, "args": { "External id": 13801,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650281292.129, "dur": 15.260, "args": { "External id": 13802,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650281310.562, "dur": 16733.306, "args": { "External id": 13803,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650281313.377, "dur": 16729.906, "args": { "External id": 13804,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650281319.539, "dur": 6.266, "args": { "External id": 13805,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650281327.595, "dur": 16712.665, "args": { "External id": 13806,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7301 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650298261.491, "dur": 37.018, "args": { "External id": 13807,"Sequence number": 246573, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7302 } }, { "ph": "s", "id": 195, "pid": 1336754, "tid": 1336754, "ts": 1295650298261.491, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650298285.413, "dur": 7.788, "args": { "External id": 13808,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650298288.707, "dur": 4.139, "args": { "External id": 13809,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7304 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650298363.984, "dur": 76.287, "args": { "External id": 13810,"Record function id": 0, "Ev Idx": 7305 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650298441.873, "dur": 1164.056, "args": { "External id": 13811,"Record function id": 0, "Ev Idx": 7306 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650298481.510, "dur": 1110.895, "args": { "External id": 13812,"Sequence number": 246574, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7307 } }, { "ph": "s", "id": 194, "pid": 1336754, "tid": 1336754, "ts": 1295650298481.510, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650298546.979, "dur": 42.996, "args": { "External id": 13813,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650298602.718, "dur": 104.269, "args": { "External id": 13814,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650298717.978, "dur": 39.024, "args": { "External id": 13815,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650298766.403, "dur": 31.517, "args": { "External id": 13816,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7311 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650298830.543, "dur": 31.327, "args": { "External id": 13817,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7312 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650298878.071, "dur": 17.751, "args": { "External id": 13818,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7313 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650298913.677, "dur": 175.729, "args": { "External id": 13819,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650298962.067, "dur": 10.583, "args": { "External id": 13820,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650298966.301, "dur": 5.609, "args": { "External id": 13821,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650298975.336, "dur": 45.858, "args": { "External id": 13822,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650299024.200, "dur": 1.752, "args": { "External id": 13823,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650299028.807, "dur": 6.505, "args": { "External id": 13824,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650299130.695, "dur": 59.817, "args": { "External id": 13825,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7320 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650299244.247, "dur": 34.851, "args": { "External id": 13826,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650299291.921, "dur": 48.201, "args": { "External id": 13827,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650299349.236, "dur": 35.317, "args": { "External id": 13828,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7323 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650299406.694, "dur": 27.954, "args": { "External id": 13829,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650299440.537, "dur": 41.876, "args": { "External id": 13830,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7325 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650299506.093, "dur": 18.810, "args": { "External id": 13831,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7326 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.16)", "pid": 1336754, "tid": 1336754, "ts": 1295650299672.036, "dur": 75.030, "args": { "External id": 13832,"Record function id": 0, "Ev Idx": 7327 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650299820.130, "dur": 45.610, "args": { "External id": 13833,"Record function id": 0, "Ev Idx": 7328 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.17)", "pid": 1336754, "tid": 1336754, "ts": 1295650299874.551, "dur": 18270.576, "args": { "External id": 13834,"Record function id": 0, "Ev Idx": 7329 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.17)", "pid": 1336754, "tid": 1336754, "ts": 1295650299883.878, "dur": 895.237, "args": { "External id": 13835,"Record function id": 0, "Ev Idx": 7330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650299964.759, "dur": 8.176, "args": { "External id": 13836,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650300026.300, "dur": 36.847, "args": { "External id": 13837,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300032.270, "dur": 2.605, "args": { "External id": 13838,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300040.174, "dur": 0.507, "args": { "External id": 13839,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300042.013, "dur": 0.520, "args": { "External id": 13840,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300043.856, "dur": 0.340, "args": { "External id": 13841,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300047.553, "dur": 0.285, "args": { "External id": 13842,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300049.150, "dur": 0.410, "args": { "External id": 13843,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300050.807, "dur": 3.663, "args": { "External id": 13844,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300056.017, "dur": 0.192, "args": { "External id": 13845,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300057.335, "dur": 0.174, "args": { "External id": 13846,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650300074.995, "dur": 41.719, "args": { "External id": 13847,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7342 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650300152.437, "dur": 128.607, "args": { "External id": 13848,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650300163.562, "dur": 4.842, "args": { "External id": 13849,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650300173.896, "dur": 10.011, "args": { "External id": 13850,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650300178.515, "dur": 4.957, "args": { "External id": 13851,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300181.775, "dur": 0.469, "args": { "External id": 13852,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650300191.289, "dur": 28.724, "args": { "External id": 13853,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300193.201, "dur": 2.622, "args": { "External id": 13854,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300197.522, "dur": 0.219, "args": { "External id": 13855,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300198.941, "dur": 0.400, "args": { "External id": 13856,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300203.071, "dur": 1.189, "args": { "External id": 13857,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300205.903, "dur": 0.161, "args": { "External id": 13858,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300207.402, "dur": 0.182, "args": { "External id": 13859,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300210.325, "dur": 0.220, "args": { "External id": 13860,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300211.960, "dur": 0.430, "args": { "External id": 13861,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650300213.399, "dur": 2.801, "args": { "External id": 13862,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650300246.971, "dur": 25.289, "args": { "External id": 13863,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7358 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650300338.354, "dur": 351.467, "args": { "External id": 13864,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7359 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650300373.031, "dur": 312.107, "args": { "External id": 13865,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7360, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650300383.299, "dur": 296.741, "args": { "External id": 13866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7361 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650300712.388, "dur": 2.173, "args": { "External id": 13867,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7362, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.17)", "pid": 1336754, "tid": 1336754, "ts": 1295650300799.287, "dur": 17122.470, "args": { "External id": 13868,"Record function id": 0, "Ev Idx": 7363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300896.219, "dur": 5.682, "args": { "External id": 13869,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300905.200, "dur": 0.731, "args": { "External id": 13870,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300907.714, "dur": 1.742, "args": { "External id": 13871,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300911.168, "dur": 0.779, "args": { "External id": 13872,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300913.348, "dur": 0.765, "args": { "External id": 13873,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300915.260, "dur": 0.582, "args": { "External id": 13874,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300919.591, "dur": 0.536, "args": { "External id": 13875,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300921.520, "dur": 1.759, "args": { "External id": 13876,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300925.159, "dur": 0.747, "args": { "External id": 13877,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650300927.241, "dur": 0.639, "args": { "External id": 13878,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7373 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650300947.626, "dur": 16933.027, "args": { "External id": 13879,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650300963.562, "dur": 16910.011, "args": { "External id": 13880,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650301023.047, "dur": 15.290, "args": { "External id": 13881,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650301041.837, "dur": 16796.196, "args": { "External id": 13882,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650301044.423, "dur": 16793.089, "args": { "External id": 13883,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650301050.070, "dur": 6.020, "args": { "External id": 13884,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650301057.781, "dur": 16776.836, "args": { "External id": 13885,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7380 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650318077.460, "dur": 40.302, "args": { "External id": 13886,"Sequence number": 246575, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7381 } }, { "ph": "s", "id": 193, "pid": 1336754, "tid": 1336754, "ts": 1295650318077.460, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650318104.323, "dur": 7.999, "args": { "External id": 13887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650318107.544, "dur": 4.459, "args": { "External id": 13888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7383 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650318185.434, "dur": 88.714, "args": { "External id": 13889,"Record function id": 0, "Ev Idx": 7384 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650318277.609, "dur": 1103.196, "args": { "External id": 13890,"Record function id": 0, "Ev Idx": 7385 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650318318.997, "dur": 1047.664, "args": { "External id": 13891,"Sequence number": 246576, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7386 } }, { "ph": "s", "id": 192, "pid": 1336754, "tid": 1336754, "ts": 1295650318318.997, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650318385.971, "dur": 47.269, "args": { "External id": 13892,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650318446.102, "dur": 105.687, "args": { "External id": 13893,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650318561.375, "dur": 39.284, "args": { "External id": 13894,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650318610.034, "dur": 31.004, "args": { "External id": 13895,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7390 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650318666.960, "dur": 28.146, "args": { "External id": 13896,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7391 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650318713.216, "dur": 16.357, "args": { "External id": 13897,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7392 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650318747.586, "dur": 127.899, "args": { "External id": 13898,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650318797.330, "dur": 11.120, "args": { "External id": 13899,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650318802.103, "dur": 5.451, "args": { "External id": 13900,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650318811.348, "dur": 5.578, "args": { "External id": 13901,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650318818.085, "dur": 1.368, "args": { "External id": 13902,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650318822.175, "dur": 3.846, "args": { "External id": 13903,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650318885.677, "dur": 47.068, "args": { "External id": 13904,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7399 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650318963.014, "dur": 71.161, "args": { "External id": 13905,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650319047.035, "dur": 46.282, "args": { "External id": 13906,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650319102.781, "dur": 35.521, "args": { "External id": 13907,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7402 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650319163.023, "dur": 30.687, "args": { "External id": 13908,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650319199.607, "dur": 49.555, "args": { "External id": 13909,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7404 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650319273.869, "dur": 21.435, "args": { "External id": 13910,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7405 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.17)", "pid": 1336754, "tid": 1336754, "ts": 1295650319444.026, "dur": 75.203, "args": { "External id": 13911,"Record function id": 0, "Ev Idx": 7406 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650319589.766, "dur": 45.453, "args": { "External id": 13912,"Record function id": 0, "Ev Idx": 7407 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.18)", "pid": 1336754, "tid": 1336754, "ts": 1295650319644.655, "dur": 18284.521, "args": { "External id": 13913,"Record function id": 0, "Ev Idx": 7408 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.18)", "pid": 1336754, "tid": 1336754, "ts": 1295650319654.607, "dur": 904.102, "args": { "External id": 13914,"Record function id": 0, "Ev Idx": 7409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650319737.410, "dur": 7.733, "args": { "External id": 13915,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650319759.495, "dur": 34.168, "args": { "External id": 13916,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319764.613, "dur": 2.267, "args": { "External id": 13917,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319771.625, "dur": 0.528, "args": { "External id": 13918,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319773.232, "dur": 0.490, "args": { "External id": 13919,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319775.413, "dur": 0.435, "args": { "External id": 13920,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319779.008, "dur": 0.448, "args": { "External id": 13921,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319781.198, "dur": 0.183, "args": { "External id": 13922,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319782.303, "dur": 3.089, "args": { "External id": 13923,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319786.774, "dur": 0.200, "args": { "External id": 13924,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319788.087, "dur": 0.162, "args": { "External id": 13925,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650319805.443, "dur": 40.657, "args": { "External id": 13926,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7421 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650319879.001, "dur": 150.529, "args": { "External id": 13927,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650319892.590, "dur": 5.839, "args": { "External id": 13928,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650319903.406, "dur": 9.978, "args": { "External id": 13929,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650319907.759, "dur": 5.199, "args": { "External id": 13930,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319911.290, "dur": 0.496, "args": { "External id": 13931,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650319920.619, "dur": 28.070, "args": { "External id": 13932,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319922.426, "dur": 0.446, "args": { "External id": 13933,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319925.134, "dur": 2.688, "args": { "External id": 13934,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319928.956, "dur": 0.249, "args": { "External id": 13935,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319930.846, "dur": 0.219, "args": { "External id": 13936,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319934.198, "dur": 0.821, "args": { "External id": 13937,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319936.540, "dur": 0.613, "args": { "External id": 13938,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319938.071, "dur": 0.453, "args": { "External id": 13939,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319942.085, "dur": 0.581, "args": { "External id": 13940,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650319944.085, "dur": 0.853, "args": { "External id": 13941,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650319960.217, "dur": 58.631, "args": { "External id": 13942,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7437 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650320087.536, "dur": 375.547, "args": { "External id": 13943,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7438 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650320122.272, "dur": 335.959, "args": { "External id": 13944,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7439, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650320133.001, "dur": 319.654, "args": { "External id": 13945,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7440 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650320489.387, "dur": 2.199, "args": { "External id": 13946,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7441, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.18)", "pid": 1336754, "tid": 1336754, "ts": 1295650320579.622, "dur": 17163.309, "args": { "External id": 13947,"Record function id": 0, "Ev Idx": 7442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320675.948, "dur": 6.910, "args": { "External id": 13948,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320686.422, "dur": 2.150, "args": { "External id": 13949,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320690.556, "dur": 1.098, "args": { "External id": 13950,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320693.396, "dur": 0.990, "args": { "External id": 13951,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320696.016, "dur": 0.871, "args": { "External id": 13952,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320698.253, "dur": 0.842, "args": { "External id": 13953,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320702.487, "dur": 1.149, "args": { "External id": 13954,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320705.445, "dur": 2.063, "args": { "External id": 13955,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320708.843, "dur": 0.845, "args": { "External id": 13956,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650320711.281, "dur": 1.077, "args": { "External id": 13957,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7452 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650320732.774, "dur": 16970.920, "args": { "External id": 13958,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650320749.079, "dur": 16947.972, "args": { "External id": 13959,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650320769.343, "dur": 13.883, "args": { "External id": 13960,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650320786.360, "dur": 16877.300, "args": { "External id": 13961,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650320788.606, "dur": 16874.517, "args": { "External id": 13962,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650320794.750, "dur": 5.486, "args": { "External id": 13963,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650320801.876, "dur": 16858.213, "args": { "External id": 13964,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7459 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650337868.900, "dur": 36.046, "args": { "External id": 13965,"Sequence number": 246577, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7460 } }, { "ph": "s", "id": 191, "pid": 1336754, "tid": 1336754, "ts": 1295650337868.900, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650337892.146, "dur": 7.577, "args": { "External id": 13966,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650337895.307, "dur": 4.165, "args": { "External id": 13967,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7462 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650337968.332, "dur": 104.214, "args": { "External id": 13968,"Record function id": 0, "Ev Idx": 7463 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650338075.958, "dur": 1105.136, "args": { "External id": 13969,"Record function id": 0, "Ev Idx": 7464 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650338118.233, "dur": 1049.020, "args": { "External id": 13970,"Sequence number": 246578, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7465 } }, { "ph": "s", "id": 190, "pid": 1336754, "tid": 1336754, "ts": 1295650338118.233, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650338193.863, "dur": 57.638, "args": { "External id": 13971,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338270.291, "dur": 106.738, "args": { "External id": 13972,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338387.082, "dur": 40.765, "args": { "External id": 13973,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338434.960, "dur": 31.481, "args": { "External id": 13974,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7469 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650338495.685, "dur": 27.966, "args": { "External id": 13975,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7470 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650338540.494, "dur": 20.162, "args": { "External id": 13976,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7471 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650338576.312, "dur": 132.972, "args": { "External id": 13977,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650338628.670, "dur": 11.407, "args": { "External id": 13978,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650338633.479, "dur": 5.943, "args": { "External id": 13979,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650338642.893, "dur": 5.567, "args": { "External id": 13980,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650338650.009, "dur": 3.384, "args": { "External id": 13981,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650338655.667, "dur": 3.109, "args": { "External id": 13982,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338719.890, "dur": 46.689, "args": { "External id": 13983,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7478 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650338799.134, "dur": 27.693, "args": { "External id": 13984,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338835.887, "dur": 42.398, "args": { "External id": 13985,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338885.505, "dur": 34.194, "args": { "External id": 13986,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7481 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650338945.672, "dur": 27.672, "args": { "External id": 13987,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650338979.276, "dur": 75.513, "args": { "External id": 13988,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7483 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650339078.916, "dur": 23.456, "args": { "External id": 13989,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7484 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.18)", "pid": 1336754, "tid": 1336754, "ts": 1295650339260.358, "dur": 74.329, "args": { "External id": 13990,"Record function id": 0, "Ev Idx": 7485 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650339409.806, "dur": 47.349, "args": { "External id": 13991,"Record function id": 0, "Ev Idx": 7486 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.19)", "pid": 1336754, "tid": 1336754, "ts": 1295650339466.674, "dur": 18337.241, "args": { "External id": 13992,"Record function id": 0, "Ev Idx": 7487 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.19)", "pid": 1336754, "tid": 1336754, "ts": 1295650339475.429, "dur": 941.921, "args": { "External id": 13993,"Record function id": 0, "Ev Idx": 7488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650339552.993, "dur": 9.587, "args": { "External id": 13994,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650339576.755, "dur": 38.290, "args": { "External id": 13995,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339583.015, "dur": 2.421, "args": { "External id": 13996,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339590.099, "dur": 0.497, "args": { "External id": 13997,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339592.084, "dur": 0.653, "args": { "External id": 13998,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339593.954, "dur": 0.680, "args": { "External id": 13999,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339598.518, "dur": 0.955, "args": { "External id": 14000,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339600.674, "dur": 0.666, "args": { "External id": 14001,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339602.867, "dur": 2.549, "args": { "External id": 14002,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339606.498, "dur": 0.486, "args": { "External id": 14003,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339608.607, "dur": 0.787, "args": { "External id": 14004,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650339626.156, "dur": 40.166, "args": { "External id": 14005,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7500 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650339698.512, "dur": 108.892, "args": { "External id": 14006,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650339708.724, "dur": 4.577, "args": { "External id": 14007,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650339718.625, "dur": 10.500, "args": { "External id": 14008,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650339723.029, "dur": 5.670, "args": { "External id": 14009,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339726.133, "dur": 1.107, "args": { "External id": 14010,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650339735.927, "dur": 29.927, "args": { "External id": 14011,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339738.193, "dur": 2.326, "args": { "External id": 14012,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339741.569, "dur": 0.491, "args": { "External id": 14013,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339743.654, "dur": 0.505, "args": { "External id": 14014,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339747.619, "dur": 0.701, "args": { "External id": 14015,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339749.599, "dur": 0.696, "args": { "External id": 14016,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339751.227, "dur": 0.538, "args": { "External id": 14017,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339755.585, "dur": 0.883, "args": { "External id": 14018,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339757.639, "dur": 0.556, "args": { "External id": 14019,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650339759.470, "dur": 2.758, "args": { "External id": 14020,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650339778.421, "dur": 21.303, "args": { "External id": 14021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7516 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650339858.953, "dur": 452.949, "args": { "External id": 14022,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7517 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650339893.739, "dur": 412.155, "args": { "External id": 14023,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7518, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650339903.829, "dur": 395.372, "args": { "External id": 14024,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7519 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650340339.319, "dur": 2.408, "args": { "External id": 14025,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7520, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.19)", "pid": 1336754, "tid": 1336754, "ts": 1295650340439.724, "dur": 17168.739, "args": { "External id": 14026,"Record function id": 0, "Ev Idx": 7521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340541.844, "dur": 6.856, "args": { "External id": 14027,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340561.550, "dur": 1.531, "args": { "External id": 14028,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340564.716, "dur": 1.297, "args": { "External id": 14029,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340569.390, "dur": 1.110, "args": { "External id": 14030,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340571.665, "dur": 0.925, "args": { "External id": 14031,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340574.048, "dur": 0.907, "args": { "External id": 14032,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340576.579, "dur": 0.954, "args": { "External id": 14033,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340581.591, "dur": 2.139, "args": { "External id": 14034,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340585.165, "dur": 1.055, "args": { "External id": 14035,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650340588.018, "dur": 1.030, "args": { "External id": 14036,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7531 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650340608.969, "dur": 16960.358, "args": { "External id": 14037,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650340624.984, "dur": 16937.450, "args": { "External id": 14038,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650340643.321, "dur": 14.245, "args": { "External id": 14039,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650340662.874, "dur": 16864.723, "args": { "External id": 14040,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650340665.016, "dur": 16861.885, "args": { "External id": 14041,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650340671.444, "dur": 5.740, "args": { "External id": 14042,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650340679.146, "dur": 16844.748, "args": { "External id": 14043,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7538 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650357739.736, "dur": 38.825, "args": { "External id": 14044,"Sequence number": 246579, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7539 } }, { "ph": "s", "id": 189, "pid": 1336754, "tid": 1336754, "ts": 1295650357739.736, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650357765.296, "dur": 8.000, "args": { "External id": 14045,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650357768.571, "dur": 4.469, "args": { "External id": 14046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7541 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650357844.929, "dur": 79.331, "args": { "External id": 14047,"Record function id": 0, "Ev Idx": 7542 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650357925.780, "dur": 1130.838, "args": { "External id": 14048,"Record function id": 0, "Ev Idx": 7543 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650357965.396, "dur": 1076.250, "args": { "External id": 14049,"Sequence number": 246580, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7544 } }, { "ph": "s", "id": 188, "pid": 1336754, "tid": 1336754, "ts": 1295650357965.396, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650358067.111, "dur": 45.273, "args": { "External id": 14050,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358126.185, "dur": 118.646, "args": { "External id": 14051,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358257.284, "dur": 44.039, "args": { "External id": 14052,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358311.785, "dur": 31.963, "args": { "External id": 14053,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7548 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650358369.009, "dur": 30.630, "args": { "External id": 14054,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7549 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650358420.571, "dur": 15.530, "args": { "External id": 14055,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7550 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650358454.359, "dur": 131.367, "args": { "External id": 14056,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650358506.899, "dur": 11.532, "args": { "External id": 14057,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650358511.519, "dur": 6.137, "args": { "External id": 14058,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650358521.140, "dur": 6.107, "args": { "External id": 14059,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650358528.923, "dur": 1.836, "args": { "External id": 14060,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650358532.977, "dur": 2.727, "args": { "External id": 14061,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358597.690, "dur": 47.724, "args": { "External id": 14062,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7557 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650358676.818, "dur": 28.842, "args": { "External id": 14063,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358714.742, "dur": 42.516, "args": { "External id": 14064,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358766.929, "dur": 35.633, "args": { "External id": 14065,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7560 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650358826.877, "dur": 27.621, "args": { "External id": 14066,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650358860.556, "dur": 34.962, "args": { "External id": 14067,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7562 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650358919.014, "dur": 19.892, "args": { "External id": 14068,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7563 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.19)", "pid": 1336754, "tid": 1336754, "ts": 1295650359121.394, "dur": 75.729, "args": { "External id": 14069,"Record function id": 0, "Ev Idx": 7564 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650359287.885, "dur": 48.887, "args": { "External id": 14070,"Record function id": 0, "Ev Idx": 7565 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.20)", "pid": 1336754, "tid": 1336754, "ts": 1295650359346.378, "dur": 18492.355, "args": { "External id": 14071,"Record function id": 0, "Ev Idx": 7566 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.20)", "pid": 1336754, "tid": 1336754, "ts": 1295650359355.158, "dur": 902.941, "args": { "External id": 14072,"Record function id": 0, "Ev Idx": 7567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650359435.591, "dur": 9.648, "args": { "External id": 14073,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650359459.586, "dur": 38.146, "args": { "External id": 14074,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359465.357, "dur": 2.684, "args": { "External id": 14075,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359473.368, "dur": 0.612, "args": { "External id": 14076,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359475.499, "dur": 0.525, "args": { "External id": 14077,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359477.001, "dur": 0.790, "args": { "External id": 14078,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359481.528, "dur": 0.637, "args": { "External id": 14079,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359483.744, "dur": 0.651, "args": { "External id": 14080,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359485.928, "dur": 2.747, "args": { "External id": 14081,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359489.887, "dur": 0.581, "args": { "External id": 14082,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359491.919, "dur": 0.547, "args": { "External id": 14083,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650359508.448, "dur": 43.925, "args": { "External id": 14084,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7579 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650359584.804, "dur": 111.558, "args": { "External id": 14085,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650359596.163, "dur": 4.602, "args": { "External id": 14086,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650359606.080, "dur": 9.596, "args": { "External id": 14087,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650359610.216, "dur": 5.075, "args": { "External id": 14088,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359613.407, "dur": 0.632, "args": { "External id": 14089,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650359622.034, "dur": 34.251, "args": { "External id": 14090,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359623.908, "dur": 3.491, "args": { "External id": 14091,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359628.963, "dur": 0.886, "args": { "External id": 14092,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359634.581, "dur": 0.473, "args": { "External id": 14093,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359638.228, "dur": 0.706, "args": { "External id": 14094,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359640.217, "dur": 0.621, "args": { "External id": 14095,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359642.213, "dur": 2.247, "args": { "External id": 14096,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359646.019, "dur": 0.456, "args": { "External id": 14097,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359647.801, "dur": 0.406, "args": { "External id": 14098,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650359651.922, "dur": 0.647, "args": { "External id": 14099,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650359665.597, "dur": 22.762, "args": { "External id": 14100,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7595 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650359748.629, "dur": 395.852, "args": { "External id": 14101,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7596 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650359780.847, "dur": 358.195, "args": { "External id": 14102,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7597, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650359791.368, "dur": 341.786, "args": { "External id": 14103,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7598 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650360171.085, "dur": 2.385, "args": { "External id": 14104,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7599, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.20)", "pid": 1336754, "tid": 1336754, "ts": 1295650360281.065, "dur": 17367.815, "args": { "External id": 14105,"Record function id": 0, "Ev Idx": 7600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360380.933, "dur": 7.078, "args": { "External id": 14106,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360391.639, "dur": 1.160, "args": { "External id": 14107,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360394.494, "dur": 1.110, "args": { "External id": 14108,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360397.115, "dur": 0.994, "args": { "External id": 14109,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360399.559, "dur": 0.955, "args": { "External id": 14110,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360401.841, "dur": 0.793, "args": { "External id": 14111,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360406.611, "dur": 1.360, "args": { "External id": 14112,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360409.467, "dur": 1.879, "args": { "External id": 14113,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360413.485, "dur": 1.057, "args": { "External id": 14114,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650360415.879, "dur": 1.136, "args": { "External id": 14115,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7610 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650360437.812, "dur": 17172.403, "args": { "External id": 14116,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650360453.268, "dur": 17150.255, "args": { "External id": 14117,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650360473.740, "dur": 14.363, "args": { "External id": 14118,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650360491.004, "dur": 17077.191, "args": { "External id": 14119,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650360493.678, "dur": 17073.998, "args": { "External id": 14120,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650360500.114, "dur": 5.725, "args": { "External id": 14121,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650360507.417, "dur": 17056.803, "args": { "External id": 14122,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7617 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650377774.755, "dur": 40.607, "args": { "External id": 14123,"Sequence number": 246581, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7618 } }, { "ph": "s", "id": 187, "pid": 1336754, "tid": 1336754, "ts": 1295650377774.755, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650377802.268, "dur": 7.765, "args": { "External id": 14124,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650377805.362, "dur": 4.426, "args": { "External id": 14125,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7620 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650377876.684, "dur": 78.548, "args": { "External id": 14126,"Record function id": 0, "Ev Idx": 7621 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650377956.672, "dur": 1144.160, "args": { "External id": 14127,"Record function id": 0, "Ev Idx": 7622 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650378027.601, "dur": 1059.226, "args": { "External id": 14128,"Sequence number": 246582, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7623 } }, { "ph": "s", "id": 186, "pid": 1336754, "tid": 1336754, "ts": 1295650378027.601, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650378098.529, "dur": 44.913, "args": { "External id": 14129,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378156.555, "dur": 126.324, "args": { "External id": 14130,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378297.094, "dur": 43.405, "args": { "External id": 14131,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378348.160, "dur": 32.695, "args": { "External id": 14132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7627 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650378411.427, "dur": 28.286, "args": { "External id": 14133,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7628 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650378457.414, "dur": 17.114, "args": { "External id": 14134,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7629 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650378491.916, "dur": 134.722, "args": { "External id": 14135,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650378543.808, "dur": 11.891, "args": { "External id": 14136,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650378549.017, "dur": 5.942, "args": { "External id": 14137,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650378558.318, "dur": 6.038, "args": { "External id": 14138,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650378565.581, "dur": 1.361, "args": { "External id": 14139,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650378572.141, "dur": 3.047, "args": { "External id": 14140,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378638.948, "dur": 50.319, "args": { "External id": 14141,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7636 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650378721.689, "dur": 30.928, "args": { "External id": 14142,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378762.162, "dur": 42.505, "args": { "External id": 14143,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378811.692, "dur": 35.114, "args": { "External id": 14144,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7639 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650378871.541, "dur": 30.613, "args": { "External id": 14145,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650378908.194, "dur": 34.642, "args": { "External id": 14146,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7641 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650378961.763, "dur": 18.272, "args": { "External id": 14147,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7642 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.20)", "pid": 1336754, "tid": 1336754, "ts": 1295650379165.449, "dur": 93.792, "args": { "External id": 14148,"Record function id": 0, "Ev Idx": 7643 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650379337.038, "dur": 47.653, "args": { "External id": 14149,"Record function id": 0, "Ev Idx": 7644 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.21)", "pid": 1336754, "tid": 1336754, "ts": 1295650379393.004, "dur": 18189.647, "args": { "External id": 14150,"Record function id": 0, "Ev Idx": 7645 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.21)", "pid": 1336754, "tid": 1336754, "ts": 1295650379403.578, "dur": 936.134, "args": { "External id": 14151,"Record function id": 0, "Ev Idx": 7646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650379482.890, "dur": 9.713, "args": { "External id": 14152,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650379507.496, "dur": 35.454, "args": { "External id": 14153,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379512.504, "dur": 2.487, "args": { "External id": 14154,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379519.980, "dur": 0.658, "args": { "External id": 14155,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379521.736, "dur": 0.559, "args": { "External id": 14156,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379523.614, "dur": 0.609, "args": { "External id": 14157,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379526.868, "dur": 0.690, "args": { "External id": 14158,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379529.190, "dur": 0.892, "args": { "External id": 14159,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379531.093, "dur": 2.430, "args": { "External id": 14160,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379534.759, "dur": 0.501, "args": { "External id": 14161,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379536.405, "dur": 0.575, "args": { "External id": 14162,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650379554.516, "dur": 42.052, "args": { "External id": 14163,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7658 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650379629.118, "dur": 110.916, "args": { "External id": 14164,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650379639.947, "dur": 4.621, "args": { "External id": 14165,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650379649.422, "dur": 10.335, "args": { "External id": 14166,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650379653.870, "dur": 5.494, "args": { "External id": 14167,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379657.542, "dur": 0.648, "args": { "External id": 14168,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650379666.236, "dur": 29.432, "args": { "External id": 14169,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379668.126, "dur": 2.617, "args": { "External id": 14170,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379672.049, "dur": 0.947, "args": { "External id": 14171,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379674.276, "dur": 0.623, "args": { "External id": 14172,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379678.702, "dur": 0.641, "args": { "External id": 14173,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379680.124, "dur": 0.775, "args": { "External id": 14174,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379682.331, "dur": 0.407, "args": { "External id": 14175,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379685.454, "dur": 0.578, "args": { "External id": 14176,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379687.516, "dur": 0.473, "args": { "External id": 14177,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650379689.022, "dur": 2.695, "args": { "External id": 14178,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650379709.394, "dur": 22.877, "args": { "External id": 14179,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7674 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650379802.630, "dur": 419.052, "args": { "External id": 14180,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7675 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650379834.375, "dur": 381.392, "args": { "External id": 14181,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7676, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650379844.705, "dur": 362.388, "args": { "External id": 14182,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7677 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650380262.877, "dur": 3.310, "args": { "External id": 14183,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7678, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.21)", "pid": 1336754, "tid": 1336754, "ts": 1295650380359.781, "dur": 17031.542, "args": { "External id": 14184,"Record function id": 0, "Ev Idx": 7679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380456.583, "dur": 6.178, "args": { "External id": 14185,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380466.015, "dur": 1.220, "args": { "External id": 14186,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380468.804, "dur": 1.100, "args": { "External id": 14187,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380471.587, "dur": 0.838, "args": { "External id": 14188,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380473.804, "dur": 1.304, "args": { "External id": 14189,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380478.544, "dur": 1.133, "args": { "External id": 14190,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380481.324, "dur": 1.071, "args": { "External id": 14191,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380483.804, "dur": 1.752, "args": { "External id": 14192,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380487.372, "dur": 0.496, "args": { "External id": 14193,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650380491.141, "dur": 0.842, "args": { "External id": 14194,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7689 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650380509.606, "dur": 16843.605, "args": { "External id": 14195,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650380525.314, "dur": 16821.388, "args": { "External id": 14196,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650380545.513, "dur": 13.759, "args": { "External id": 14197,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650380562.277, "dur": 16748.230, "args": { "External id": 14198,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650380564.773, "dur": 16745.212, "args": { "External id": 14199,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650380570.481, "dur": 7.218, "args": { "External id": 14200,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650380579.395, "dur": 16727.582, "args": { "External id": 14201,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7696 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650397521.437, "dur": 35.601, "args": { "External id": 14202,"Sequence number": 246583, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7697 } }, { "ph": "s", "id": 185, "pid": 1336754, "tid": 1336754, "ts": 1295650397521.437, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650397544.809, "dur": 7.163, "args": { "External id": 14203,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650397547.870, "dur": 3.868, "args": { "External id": 14204,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7699 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650397621.828, "dur": 77.589, "args": { "External id": 14205,"Record function id": 0, "Ev Idx": 7700 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650397701.008, "dur": 1101.251, "args": { "External id": 14206,"Record function id": 0, "Ev Idx": 7701 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650397738.975, "dur": 1049.674, "args": { "External id": 14207,"Sequence number": 246584, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7702 } }, { "ph": "s", "id": 184, "pid": 1336754, "tid": 1336754, "ts": 1295650397738.975, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650397804.799, "dur": 42.709, "args": { "External id": 14208,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650397860.165, "dur": 102.351, "args": { "External id": 14209,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650397971.195, "dur": 83.109, "args": { "External id": 14210,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650398067.261, "dur": 34.060, "args": { "External id": 14211,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7706 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650398128.724, "dur": 29.658, "args": { "External id": 14212,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7707 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650398176.488, "dur": 15.507, "args": { "External id": 14213,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7708 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650398209.788, "dur": 151.634, "args": { "External id": 14214,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650398278.213, "dur": 12.971, "args": { "External id": 14215,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650398282.989, "dur": 7.114, "args": { "External id": 14216,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650398294.122, "dur": 6.846, "args": { "External id": 14217,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650398302.220, "dur": 1.753, "args": { "External id": 14218,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650398306.530, "dur": 2.726, "args": { "External id": 14219,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650398372.429, "dur": 52.607, "args": { "External id": 14220,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7715 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650398458.074, "dur": 28.369, "args": { "External id": 14221,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650398495.180, "dur": 41.487, "args": { "External id": 14222,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650398545.896, "dur": 35.544, "args": { "External id": 14223,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7718 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650398606.926, "dur": 26.997, "args": { "External id": 14224,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650398640.668, "dur": 35.749, "args": { "External id": 14225,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7720 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650398698.969, "dur": 19.465, "args": { "External id": 14226,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7721 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.21)", "pid": 1336754, "tid": 1336754, "ts": 1295650398865.605, "dur": 70.883, "args": { "External id": 14227,"Record function id": 0, "Ev Idx": 7722 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650399049.882, "dur": 49.605, "args": { "External id": 14228,"Record function id": 0, "Ev Idx": 7723 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.22)", "pid": 1336754, "tid": 1336754, "ts": 1295650399108.687, "dur": 18143.360, "args": { "External id": 14229,"Record function id": 0, "Ev Idx": 7724 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.22)", "pid": 1336754, "tid": 1336754, "ts": 1295650399117.907, "dur": 945.996, "args": { "External id": 14230,"Record function id": 0, "Ev Idx": 7725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650399198.218, "dur": 9.341, "args": { "External id": 14231,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650399221.758, "dur": 53.783, "args": { "External id": 14232,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399240.707, "dur": 2.683, "args": { "External id": 14233,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399248.800, "dur": 0.855, "args": { "External id": 14234,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399251.081, "dur": 0.752, "args": { "External id": 14235,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399253.481, "dur": 0.705, "args": { "External id": 14236,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399257.566, "dur": 0.933, "args": { "External id": 14237,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399259.866, "dur": 0.852, "args": { "External id": 14238,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399262.089, "dur": 2.557, "args": { "External id": 14239,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399266.315, "dur": 1.049, "args": { "External id": 14240,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399268.942, "dur": 0.666, "args": { "External id": 14241,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650399287.393, "dur": 42.519, "args": { "External id": 14242,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7737 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650399364.364, "dur": 116.606, "args": { "External id": 14243,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650399375.383, "dur": 5.377, "args": { "External id": 14244,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650399385.916, "dur": 11.003, "args": { "External id": 14245,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650399390.714, "dur": 5.769, "args": { "External id": 14246,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399394.146, "dur": 1.024, "args": { "External id": 14247,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650399404.469, "dur": 33.181, "args": { "External id": 14248,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399406.597, "dur": 2.587, "args": { "External id": 14249,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399411.010, "dur": 0.946, "args": { "External id": 14250,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399413.119, "dur": 0.706, "args": { "External id": 14251,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399417.247, "dur": 0.473, "args": { "External id": 14252,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399418.889, "dur": 0.398, "args": { "External id": 14253,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399420.640, "dur": 0.632, "args": { "External id": 14254,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399424.235, "dur": 1.225, "args": { "External id": 14255,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399426.506, "dur": 1.126, "args": { "External id": 14256,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650399431.554, "dur": 2.206, "args": { "External id": 14257,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650399450.798, "dur": 22.322, "args": { "External id": 14258,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7753 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650399536.660, "dur": 394.299, "args": { "External id": 14259,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7754 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650399567.454, "dur": 358.297, "args": { "External id": 14260,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7755, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650399578.016, "dur": 341.458, "args": { "External id": 14261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7756 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650399956.421, "dur": 2.730, "args": { "External id": 14262,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7757, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.22)", "pid": 1336754, "tid": 1336754, "ts": 1295650400087.255, "dur": 16951.456, "args": { "External id": 14263,"Record function id": 0, "Ev Idx": 7758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400187.226, "dur": 6.664, "args": { "External id": 14264,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400197.165, "dur": 1.403, "args": { "External id": 14265,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400200.552, "dur": 1.007, "args": { "External id": 14266,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400203.245, "dur": 0.923, "args": { "External id": 14267,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400205.843, "dur": 1.107, "args": { "External id": 14268,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400208.237, "dur": 0.944, "args": { "External id": 14269,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400213.111, "dur": 1.268, "args": { "External id": 14270,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400216.305, "dur": 2.111, "args": { "External id": 14271,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400219.973, "dur": 1.091, "args": { "External id": 14272,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650400222.730, "dur": 0.788, "args": { "External id": 14273,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7768 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650400259.052, "dur": 16716.306, "args": { "External id": 14274,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650400282.303, "dur": 16686.255, "args": { "External id": 14275,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650400301.453, "dur": 13.588, "args": { "External id": 14276,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650400318.380, "dur": 16614.365, "args": { "External id": 14277,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650400320.822, "dur": 16611.386, "args": { "External id": 14278,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650400327.489, "dur": 8.138, "args": { "External id": 14279,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650400337.249, "dur": 16591.995, "args": { "External id": 14280,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7775 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650417174.785, "dur": 39.764, "args": { "External id": 14281,"Sequence number": 246585, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7776 } }, { "ph": "s", "id": 183, "pid": 1336754, "tid": 1336754, "ts": 1295650417174.785, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650417200.754, "dur": 8.555, "args": { "External id": 14282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650417204.029, "dur": 5.019, "args": { "External id": 14283,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7778 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650417293.244, "dur": 77.938, "args": { "External id": 14284,"Record function id": 0, "Ev Idx": 7779 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650417373.161, "dur": 1119.421, "args": { "External id": 14285,"Record function id": 0, "Ev Idx": 7780 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650417414.143, "dur": 1064.580, "args": { "External id": 14286,"Sequence number": 246586, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7781 } }, { "ph": "s", "id": 182, "pid": 1336754, "tid": 1336754, "ts": 1295650417414.143, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650417485.711, "dur": 44.319, "args": { "External id": 14287,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650417542.857, "dur": 107.012, "args": { "External id": 14288,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650417658.639, "dur": 39.144, "args": { "External id": 14289,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650417707.369, "dur": 31.399, "args": { "External id": 14290,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7785 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650417765.396, "dur": 26.592, "args": { "External id": 14291,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7786 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650417812.397, "dur": 17.416, "args": { "External id": 14292,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7787 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650417846.563, "dur": 129.974, "args": { "External id": 14293,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650417897.395, "dur": 11.895, "args": { "External id": 14294,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650417902.105, "dur": 6.501, "args": { "External id": 14295,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650417911.708, "dur": 6.094, "args": { "External id": 14296,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650417919.195, "dur": 1.638, "args": { "External id": 14297,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650417923.048, "dur": 3.215, "args": { "External id": 14298,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650418027.545, "dur": 55.251, "args": { "External id": 14299,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7794 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650418116.585, "dur": 29.859, "args": { "External id": 14300,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650418155.447, "dur": 44.292, "args": { "External id": 14301,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650418209.163, "dur": 49.957, "args": { "External id": 14302,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7797 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650418286.319, "dur": 29.547, "args": { "External id": 14303,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650418323.352, "dur": 37.912, "args": { "External id": 14304,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7799 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650418382.596, "dur": 24.311, "args": { "External id": 14305,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7800 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.22)", "pid": 1336754, "tid": 1336754, "ts": 1295650418556.066, "dur": 70.907, "args": { "External id": 14306,"Record function id": 0, "Ev Idx": 7801 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650418698.865, "dur": 45.497, "args": { "External id": 14307,"Record function id": 0, "Ev Idx": 7802 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.23)", "pid": 1336754, "tid": 1336754, "ts": 1295650418752.725, "dur": 18168.245, "args": { "External id": 14308,"Record function id": 0, "Ev Idx": 7803 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.23)", "pid": 1336754, "tid": 1336754, "ts": 1295650418762.023, "dur": 937.989, "args": { "External id": 14309,"Record function id": 0, "Ev Idx": 7804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650418838.193, "dur": 8.811, "args": { "External id": 14310,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650418861.528, "dur": 38.378, "args": { "External id": 14311,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418866.990, "dur": 2.169, "args": { "External id": 14312,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418873.151, "dur": 1.183, "args": { "External id": 14313,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418876.244, "dur": 0.696, "args": { "External id": 14314,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418878.344, "dur": 1.021, "args": { "External id": 14315,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418882.713, "dur": 0.984, "args": { "External id": 14316,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418884.937, "dur": 0.736, "args": { "External id": 14317,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418886.902, "dur": 2.498, "args": { "External id": 14318,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418890.388, "dur": 0.691, "args": { "External id": 14319,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650418892.999, "dur": 1.262, "args": { "External id": 14320,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650418911.928, "dur": 37.800, "args": { "External id": 14321,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7816 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650419020.801, "dur": 156.809, "args": { "External id": 14322,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650419034.264, "dur": 6.974, "args": { "External id": 14323,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650419046.719, "dur": 11.479, "args": { "External id": 14324,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650419051.321, "dur": 6.471, "args": { "External id": 14325,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419054.971, "dur": 1.219, "args": { "External id": 14326,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650419066.023, "dur": 32.725, "args": { "External id": 14327,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419068.466, "dur": 2.917, "args": { "External id": 14328,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419072.832, "dur": 0.754, "args": { "External id": 14329,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419074.905, "dur": 0.693, "args": { "External id": 14330,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419079.320, "dur": 0.735, "args": { "External id": 14331,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419081.474, "dur": 0.677, "args": { "External id": 14332,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419083.375, "dur": 0.738, "args": { "External id": 14333,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419088.156, "dur": 0.652, "args": { "External id": 14334,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419090.157, "dur": 0.753, "args": { "External id": 14335,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419092.336, "dur": 2.723, "args": { "External id": 14336,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650419142.555, "dur": 26.520, "args": { "External id": 14337,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7832 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650419250.919, "dur": 354.892, "args": { "External id": 14338,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7833 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650419282.440, "dur": 318.451, "args": { "External id": 14339,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7834, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650419295.670, "dur": 299.891, "args": { "External id": 14340,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7835 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650419628.263, "dur": 2.228, "args": { "External id": 14341,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7836, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.23)", "pid": 1336754, "tid": 1336754, "ts": 1295650419722.695, "dur": 17002.672, "args": { "External id": 14342,"Record function id": 0, "Ev Idx": 7837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419820.145, "dur": 6.799, "args": { "External id": 14343,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419830.833, "dur": 1.973, "args": { "External id": 14344,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419834.614, "dur": 1.485, "args": { "External id": 14345,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419838.022, "dur": 1.459, "args": { "External id": 14346,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419840.786, "dur": 1.280, "args": { "External id": 14347,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419846.163, "dur": 1.065, "args": { "External id": 14348,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419848.604, "dur": 1.525, "args": { "External id": 14349,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419852.021, "dur": 2.051, "args": { "External id": 14350,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419855.347, "dur": 1.483, "args": { "External id": 14351,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650419860.508, "dur": 1.083, "args": { "External id": 14352,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7847 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650419879.329, "dur": 16806.985, "args": { "External id": 14353,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650419895.363, "dur": 16783.897, "args": { "External id": 14354,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650419914.708, "dur": 13.253, "args": { "External id": 14355,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650419930.832, "dur": 16714.884, "args": { "External id": 14356,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650419933.216, "dur": 16711.957, "args": { "External id": 14357,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650419939.477, "dur": 6.104, "args": { "External id": 14358,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650419947.324, "dur": 16694.622, "args": { "External id": 14359,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7854 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650436856.371, "dur": 37.604, "args": { "External id": 14360,"Sequence number": 246587, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7855 } }, { "ph": "s", "id": 181, "pid": 1336754, "tid": 1336754, "ts": 1295650436856.371, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650436881.063, "dur": 8.003, "args": { "External id": 14361,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650436884.382, "dur": 4.505, "args": { "External id": 14362,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7857 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650436960.456, "dur": 120.633, "args": { "External id": 14363,"Record function id": 0, "Ev Idx": 7858 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650437084.577, "dur": 1115.784, "args": { "External id": 14364,"Record function id": 0, "Ev Idx": 7859 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650437130.063, "dur": 1056.419, "args": { "External id": 14365,"Sequence number": 246588, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7860 } }, { "ph": "s", "id": 180, "pid": 1336754, "tid": 1336754, "ts": 1295650437130.063, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650437200.751, "dur": 58.366, "args": { "External id": 14366,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437275.648, "dur": 105.626, "args": { "External id": 14367,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437391.960, "dur": 39.321, "args": { "External id": 14368,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437441.603, "dur": 31.416, "args": { "External id": 14369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7864 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650437499.864, "dur": 27.546, "args": { "External id": 14370,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7865 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650437547.046, "dur": 15.288, "args": { "External id": 14371,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7866 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650437580.384, "dur": 134.694, "args": { "External id": 14372,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650437635.547, "dur": 11.516, "args": { "External id": 14373,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650437640.341, "dur": 5.851, "args": { "External id": 14374,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650437649.710, "dur": 5.402, "args": { "External id": 14375,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650437657.032, "dur": 1.578, "args": { "External id": 14376,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650437661.048, "dur": 4.036, "args": { "External id": 14377,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437725.119, "dur": 48.488, "args": { "External id": 14378,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7873 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650437806.049, "dur": 28.807, "args": { "External id": 14379,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437844.110, "dur": 42.600, "args": { "External id": 14380,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650437897.025, "dur": 35.787, "args": { "External id": 14381,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7876 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650437956.973, "dur": 63.649, "args": { "External id": 14382,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650438029.695, "dur": 41.565, "args": { "External id": 14383,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7878 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650438094.730, "dur": 20.643, "args": { "External id": 14384,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7879 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.23)", "pid": 1336754, "tid": 1336754, "ts": 1295650438279.543, "dur": 75.746, "args": { "External id": 14385,"Record function id": 0, "Ev Idx": 7880 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650438428.459, "dur": 48.142, "args": { "External id": 14386,"Record function id": 0, "Ev Idx": 7881 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.24)", "pid": 1336754, "tid": 1336754, "ts": 1295650438485.177, "dur": 18273.599, "args": { "External id": 14387,"Record function id": 0, "Ev Idx": 7882 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.24)", "pid": 1336754, "tid": 1336754, "ts": 1295650438494.264, "dur": 922.660, "args": { "External id": 14388,"Record function id": 0, "Ev Idx": 7883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650438575.751, "dur": 9.298, "args": { "External id": 14389,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650438600.038, "dur": 40.492, "args": { "External id": 14390,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438605.779, "dur": 2.623, "args": { "External id": 14391,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438612.856, "dur": 0.951, "args": { "External id": 14392,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438615.365, "dur": 1.018, "args": { "External id": 14393,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438617.905, "dur": 0.742, "args": { "External id": 14394,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438622.151, "dur": 0.886, "args": { "External id": 14395,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438624.264, "dur": 1.140, "args": { "External id": 14396,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438626.850, "dur": 3.049, "args": { "External id": 14397,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438631.550, "dur": 0.881, "args": { "External id": 14398,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438634.117, "dur": 0.855, "args": { "External id": 14399,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650438651.514, "dur": 43.177, "args": { "External id": 14400,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7895 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650438727.193, "dur": 115.997, "args": { "External id": 14401,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650438738.205, "dur": 4.766, "args": { "External id": 14402,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650438747.852, "dur": 11.226, "args": { "External id": 14403,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650438752.343, "dur": 6.339, "args": { "External id": 14404,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438756.297, "dur": 1.179, "args": { "External id": 14405,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650438766.006, "dur": 31.668, "args": { "External id": 14406,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438768.159, "dur": 2.853, "args": { "External id": 14407,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438772.515, "dur": 0.710, "args": { "External id": 14408,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438774.621, "dur": 1.395, "args": { "External id": 14409,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438779.575, "dur": 0.871, "args": { "External id": 14410,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438781.698, "dur": 0.587, "args": { "External id": 14411,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438783.469, "dur": 0.673, "args": { "External id": 14412,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438787.414, "dur": 0.866, "args": { "External id": 14413,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438789.295, "dur": 0.820, "args": { "External id": 14414,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650438791.733, "dur": 2.282, "args": { "External id": 14415,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650438810.726, "dur": 24.823, "args": { "External id": 14416,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7911 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650438895.967, "dur": 420.265, "args": { "External id": 14417,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7912 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650438932.892, "dur": 377.181, "args": { "External id": 14418,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7913, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650438943.200, "dur": 361.199, "args": { "External id": 14419,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7914 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650439341.309, "dur": 2.459, "args": { "External id": 14420,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7915, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.24)", "pid": 1336754, "tid": 1336754, "ts": 1295650439437.028, "dur": 17131.095, "args": { "External id": 14421,"Record function id": 0, "Ev Idx": 7916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439537.264, "dur": 6.576, "args": { "External id": 14422,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439552.397, "dur": 1.581, "args": { "External id": 14423,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439555.833, "dur": 1.000, "args": { "External id": 14424,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439560.333, "dur": 0.751, "args": { "External id": 14425,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439562.244, "dur": 0.909, "args": { "External id": 14426,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439564.460, "dur": 0.998, "args": { "External id": 14427,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439567.100, "dur": 0.997, "args": { "External id": 14428,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439571.394, "dur": 2.386, "args": { "External id": 14429,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439575.609, "dur": 0.831, "args": { "External id": 14430,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650439577.877, "dur": 0.831, "args": { "External id": 14431,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 7926 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650439599.176, "dur": 16930.920, "args": { "External id": 14432,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650439615.008, "dur": 16908.176, "args": { "External id": 14433,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 7928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650439633.808, "dur": 14.324, "args": { "External id": 14434,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650439653.233, "dur": 16836.038, "args": { "External id": 14435,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 7930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650439655.506, "dur": 16833.255, "args": { "External id": 14436,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 7931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650439661.320, "dur": 6.374, "args": { "External id": 14437,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650439669.460, "dur": 16816.283, "args": { "External id": 14438,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 7933 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650456698.630, "dur": 36.500, "args": { "External id": 14439,"Sequence number": 246589, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 7934 } }, { "ph": "s", "id": 179, "pid": 1336754, "tid": 1336754, "ts": 1295650456698.630, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650456722.316, "dur": 7.772, "args": { "External id": 14440,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 7935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650456725.401, "dur": 4.441, "args": { "External id": 14441,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 7936 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650456798.382, "dur": 76.171, "args": { "External id": 14442,"Record function id": 0, "Ev Idx": 7937 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650456876.386, "dur": 1098.411, "args": { "External id": 14443,"Record function id": 0, "Ev Idx": 7938 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650456914.469, "dur": 1046.937, "args": { "External id": 14444,"Sequence number": 246590, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 7939 } }, { "ph": "s", "id": 178, "pid": 1336754, "tid": 1336754, "ts": 1295650456914.469, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650457013.723, "dur": 46.959, "args": { "External id": 14445,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457076.901, "dur": 106.236, "args": { "External id": 14446,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457192.828, "dur": 54.593, "args": { "External id": 14447,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457260.878, "dur": 35.918, "args": { "External id": 14448,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7943 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650457325.816, "dur": 26.502, "args": { "External id": 14449,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7944 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650457371.022, "dur": 17.768, "args": { "External id": 14450,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 7945 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650457406.522, "dur": 131.163, "args": { "External id": 14451,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 7946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650457457.721, "dur": 11.896, "args": { "External id": 14452,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 7947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650457462.686, "dur": 6.022, "args": { "External id": 14453,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650457472.363, "dur": 5.048, "args": { "External id": 14454,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650457478.749, "dur": 2.062, "args": { "External id": 14455,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650457483.010, "dur": 3.692, "args": { "External id": 14456,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457547.308, "dur": 48.299, "args": { "External id": 14457,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 7952 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650457627.565, "dur": 27.645, "args": { "External id": 14458,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 7953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457663.349, "dur": 42.453, "args": { "External id": 14459,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457715.233, "dur": 35.562, "args": { "External id": 14460,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 7955 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650457782.511, "dur": 29.705, "args": { "External id": 14461,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 7956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650457821.274, "dur": 34.663, "args": { "External id": 14462,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 7957 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650457876.473, "dur": 18.235, "args": { "External id": 14463,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 7958 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.24)", "pid": 1336754, "tid": 1336754, "ts": 1295650458078.127, "dur": 78.667, "args": { "External id": 14464,"Record function id": 0, "Ev Idx": 7959 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650458245.785, "dur": 51.664, "args": { "External id": 14465,"Record function id": 0, "Ev Idx": 7960 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.25)", "pid": 1336754, "tid": 1336754, "ts": 1295650458307.238, "dur": 18236.176, "args": { "External id": 14466,"Record function id": 0, "Ev Idx": 7961 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.25)", "pid": 1336754, "tid": 1336754, "ts": 1295650458315.709, "dur": 958.261, "args": { "External id": 14467,"Record function id": 0, "Ev Idx": 7962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650458398.950, "dur": 9.998, "args": { "External id": 14468,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650458423.640, "dur": 40.478, "args": { "External id": 14469,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458429.543, "dur": 2.428, "args": { "External id": 14470,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458437.037, "dur": 1.031, "args": { "External id": 14471,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458439.371, "dur": 0.993, "args": { "External id": 14472,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458442.037, "dur": 0.827, "args": { "External id": 14473,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458446.782, "dur": 0.924, "args": { "External id": 14474,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458448.654, "dur": 0.624, "args": { "External id": 14475,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458450.619, "dur": 2.928, "args": { "External id": 14476,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458454.668, "dur": 0.917, "args": { "External id": 14477,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458457.149, "dur": 0.958, "args": { "External id": 14478,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650458475.421, "dur": 45.726, "args": { "External id": 14479,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7974 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650458554.824, "dur": 116.815, "args": { "External id": 14480,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 7975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650458565.691, "dur": 4.679, "args": { "External id": 14481,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 7976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650458575.530, "dur": 10.339, "args": { "External id": 14482,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650458579.874, "dur": 5.611, "args": { "External id": 14483,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 7978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458583.249, "dur": 0.996, "args": { "External id": 14484,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 7979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650458593.144, "dur": 31.491, "args": { "External id": 14485,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 7980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458594.947, "dur": 3.452, "args": { "External id": 14486,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458599.790, "dur": 1.011, "args": { "External id": 14487,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458602.295, "dur": 0.760, "args": { "External id": 14488,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458606.811, "dur": 0.829, "args": { "External id": 14489,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458608.987, "dur": 0.650, "args": { "External id": 14490,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458610.753, "dur": 0.621, "args": { "External id": 14491,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458614.554, "dur": 0.502, "args": { "External id": 14492,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458616.114, "dur": 0.579, "args": { "External id": 14493,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650458618.121, "dur": 2.392, "args": { "External id": 14494,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 7989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650458639.100, "dur": 24.597, "args": { "External id": 14495,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 7990 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650458724.899, "dur": 433.318, "args": { "External id": 14496,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 7991 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650458755.813, "dur": 396.608, "args": { "External id": 14497,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 7992, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650458766.527, "dur": 379.050, "args": { "External id": 14498,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 7993 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650459184.762, "dur": 2.756, "args": { "External id": 14499,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 7994, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.25)", "pid": 1336754, "tid": 1336754, "ts": 1295650459297.150, "dur": 17053.086, "args": { "External id": 14500,"Record function id": 0, "Ev Idx": 7995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459403.375, "dur": 7.186, "args": { "External id": 14501,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 7996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459413.936, "dur": 1.595, "args": { "External id": 14502,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 7997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459417.185, "dur": 1.090, "args": { "External id": 14503,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459420.227, "dur": 1.157, "args": { "External id": 14504,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 7999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459422.763, "dur": 1.033, "args": { "External id": 14505,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459425.094, "dur": 1.074, "args": { "External id": 14506,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459429.942, "dur": 1.168, "args": { "External id": 14507,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459432.968, "dur": 2.446, "args": { "External id": 14508,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459436.956, "dur": 1.050, "args": { "External id": 14509,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650459439.590, "dur": 1.018, "args": { "External id": 14510,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8005 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650459461.490, "dur": 16849.442, "args": { "External id": 14511,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650459478.272, "dur": 16825.425, "args": { "External id": 14512,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650459500.875, "dur": 14.205, "args": { "External id": 14513,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650459518.043, "dur": 16752.259, "args": { "External id": 14514,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650459520.897, "dur": 16748.866, "args": { "External id": 14515,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650459527.226, "dur": 6.436, "args": { "External id": 14516,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650459535.469, "dur": 16731.194, "args": { "External id": 14517,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8012 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650476482.979, "dur": 36.236, "args": { "External id": 14518,"Sequence number": 246591, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8013 } }, { "ph": "s", "id": 177, "pid": 1336754, "tid": 1336754, "ts": 1295650476482.979, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650476499.422, "dur": 14.456, "args": { "External id": 14519,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650476509.180, "dur": 4.434, "args": { "External id": 14520,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8015 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650476583.066, "dur": 76.649, "args": { "External id": 14521,"Record function id": 0, "Ev Idx": 8016 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650476661.302, "dur": 1104.187, "args": { "External id": 14522,"Record function id": 0, "Ev Idx": 8017 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650476701.849, "dur": 1049.903, "args": { "External id": 14523,"Sequence number": 246592, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8018 } }, { "ph": "s", "id": 176, "pid": 1336754, "tid": 1336754, "ts": 1295650476701.849, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650476765.473, "dur": 43.102, "args": { "External id": 14524,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650476821.055, "dur": 103.318, "args": { "External id": 14525,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650476933.388, "dur": 38.984, "args": { "External id": 14526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650477018.487, "dur": 39.799, "args": { "External id": 14527,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8022 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650477087.824, "dur": 28.979, "args": { "External id": 14528,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8023 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650477135.814, "dur": 15.262, "args": { "External id": 14529,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8024 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650477168.080, "dur": 147.284, "args": { "External id": 14530,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650477219.007, "dur": 26.257, "args": { "External id": 14531,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650477223.489, "dur": 20.789, "args": { "External id": 14532,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650477248.806, "dur": 5.496, "args": { "External id": 14533,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650477255.595, "dur": 1.565, "args": { "External id": 14534,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650477260.121, "dur": 3.314, "args": { "External id": 14535,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650477326.592, "dur": 53.383, "args": { "External id": 14536,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8031 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650477412.992, "dur": 31.380, "args": { "External id": 14537,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650477453.130, "dur": 41.067, "args": { "External id": 14538,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650477503.449, "dur": 34.936, "args": { "External id": 14539,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8034 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650477562.831, "dur": 35.762, "args": { "External id": 14540,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650477605.134, "dur": 34.986, "args": { "External id": 14541,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8036 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650477660.265, "dur": 19.725, "args": { "External id": 14542,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8037 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.25)", "pid": 1336754, "tid": 1336754, "ts": 1295650477830.562, "dur": 73.409, "args": { "External id": 14543,"Record function id": 0, "Ev Idx": 8038 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650477975.702, "dur": 84.348, "args": { "External id": 14544,"Record function id": 0, "Ev Idx": 8039 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.26)", "pid": 1336754, "tid": 1336754, "ts": 1295650478070.610, "dur": 18249.781, "args": { "External id": 14545,"Record function id": 0, "Ev Idx": 8040 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.26)", "pid": 1336754, "tid": 1336754, "ts": 1295650478080.549, "dur": 874.599, "args": { "External id": 14546,"Record function id": 0, "Ev Idx": 8041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650478162.965, "dur": 9.800, "args": { "External id": 14547,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650478187.042, "dur": 38.484, "args": { "External id": 14548,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478192.768, "dur": 2.545, "args": { "External id": 14549,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478200.020, "dur": 0.994, "args": { "External id": 14550,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478202.234, "dur": 0.578, "args": { "External id": 14551,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478204.808, "dur": 0.607, "args": { "External id": 14552,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478208.633, "dur": 0.813, "args": { "External id": 14553,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478210.760, "dur": 0.864, "args": { "External id": 14554,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478212.614, "dur": 2.778, "args": { "External id": 14555,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478216.837, "dur": 0.892, "args": { "External id": 14556,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478218.945, "dur": 0.609, "args": { "External id": 14557,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650478253.224, "dur": 47.301, "args": { "External id": 14558,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8053 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650478335.406, "dur": 123.998, "args": { "External id": 14559,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650478346.923, "dur": 5.967, "args": { "External id": 14560,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650478358.176, "dur": 11.036, "args": { "External id": 14561,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650478362.725, "dur": 6.060, "args": { "External id": 14562,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478366.458, "dur": 0.913, "args": { "External id": 14563,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650478376.643, "dur": 35.522, "args": { "External id": 14564,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478379.095, "dur": 2.534, "args": { "External id": 14565,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478383.167, "dur": 0.886, "args": { "External id": 14566,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478388.899, "dur": 0.728, "args": { "External id": 14567,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478392.672, "dur": 0.829, "args": { "External id": 14568,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478394.743, "dur": 0.645, "args": { "External id": 14569,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478397.114, "dur": 2.560, "args": { "External id": 14570,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478400.689, "dur": 0.924, "args": { "External id": 14571,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478403.056, "dur": 0.695, "args": { "External id": 14572,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650478407.403, "dur": 0.734, "args": { "External id": 14573,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650478426.946, "dur": 24.893, "args": { "External id": 14574,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8069 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650478514.643, "dur": 351.847, "args": { "External id": 14575,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8070 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650478545.771, "dur": 316.211, "args": { "External id": 14576,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8071, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650478556.354, "dur": 300.119, "args": { "External id": 14577,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8072 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650478887.975, "dur": 2.007, "args": { "External id": 14578,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8073, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.26)", "pid": 1336754, "tid": 1336754, "ts": 1295650478975.321, "dur": 17121.978, "args": { "External id": 14579,"Record function id": 0, "Ev Idx": 8074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479119.840, "dur": 6.718, "args": { "External id": 14580,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479130.134, "dur": 1.800, "args": { "External id": 14581,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479140.577, "dur": 1.257, "args": { "External id": 14582,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479145.528, "dur": 1.009, "args": { "External id": 14583,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479148.103, "dur": 1.130, "args": { "External id": 14584,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479150.647, "dur": 1.441, "args": { "External id": 14585,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479154.160, "dur": 1.076, "args": { "External id": 14586,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479158.595, "dur": 1.898, "args": { "External id": 14587,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479162.125, "dur": 1.262, "args": { "External id": 14588,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650479164.937, "dur": 0.904, "args": { "External id": 14589,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8084 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650479186.892, "dur": 16870.847, "args": { "External id": 14590,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650479202.894, "dur": 16847.865, "args": { "External id": 14591,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650479221.461, "dur": 27.244, "args": { "External id": 14592,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650479255.114, "dur": 16761.004, "args": { "External id": 14593,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650479257.834, "dur": 16757.791, "args": { "External id": 14594,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650479264.384, "dur": 6.148, "args": { "External id": 14595,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650479272.419, "dur": 16740.202, "args": { "External id": 14596,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8091 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650496242.194, "dur": 39.418, "args": { "External id": 14597,"Sequence number": 246593, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8092 } }, { "ph": "s", "id": 175, "pid": 1336754, "tid": 1336754, "ts": 1295650496242.194, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650496267.632, "dur": 8.567, "args": { "External id": 14598,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650496271.016, "dur": 4.779, "args": { "External id": 14599,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8094 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650496361.484, "dur": 77.817, "args": { "External id": 14600,"Record function id": 0, "Ev Idx": 8095 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650496440.977, "dur": 1122.414, "args": { "External id": 14601,"Record function id": 0, "Ev Idx": 8096 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650496482.416, "dur": 1066.830, "args": { "External id": 14602,"Sequence number": 246594, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8097 } }, { "ph": "s", "id": 174, "pid": 1336754, "tid": 1336754, "ts": 1295650496482.416, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650496552.173, "dur": 43.843, "args": { "External id": 14603,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650496609.945, "dur": 103.976, "args": { "External id": 14604,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650496723.321, "dur": 40.184, "args": { "External id": 14605,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650496773.634, "dur": 32.153, "args": { "External id": 14606,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8101 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650496829.375, "dur": 31.658, "args": { "External id": 14607,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8102 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650496882.746, "dur": 16.740, "args": { "External id": 14608,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8103 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650496916.133, "dur": 172.895, "args": { "External id": 14609,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650496966.427, "dur": 11.725, "args": { "External id": 14610,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650496971.174, "dur": 6.185, "args": { "External id": 14611,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650496980.654, "dur": 43.060, "args": { "External id": 14612,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650497026.623, "dur": 1.742, "args": { "External id": 14613,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650497030.812, "dur": 3.698, "args": { "External id": 14614,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650497100.719, "dur": 52.054, "args": { "External id": 14615,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8110 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650497187.001, "dur": 29.818, "args": { "External id": 14616,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650497225.724, "dur": 62.575, "args": { "External id": 14617,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650497301.249, "dur": 36.832, "args": { "External id": 14618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8113 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650497361.853, "dur": 29.751, "args": { "External id": 14619,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650497398.116, "dur": 34.954, "args": { "External id": 14620,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8115 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650497454.779, "dur": 23.403, "args": { "External id": 14621,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8116 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.26)", "pid": 1336754, "tid": 1336754, "ts": 1295650497627.613, "dur": 72.956, "args": { "External id": 14622,"Record function id": 0, "Ev Idx": 8117 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::cast_forward_inputs", "pid": 1336754, "tid": 1336754, "ts": 1295650497773.407, "dur": 46.737, "args": { "External id": 14623,"Record function id": 0, "Ev Idx": 8118 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::pre_forward (model.layers.27)", "pid": 1336754, "tid": 1336754, "ts": 1295650497829.086, "dur": 18293.848, "args": { "External id": 14624,"Record function id": 0, "Ev Idx": 8119 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather (model.layers.27)", "pid": 1336754, "tid": 1336754, "ts": 1295650497838.760, "dur": 911.212, "args": { "External id": 14625,"Record function id": 0, "Ev Idx": 8120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650497920.900, "dur": 8.930, "args": { "External id": 14626,"Record function id": 0, "Concrete Inputs": ["[6423040]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650497943.492, "dur": 78.076, "args": { "External id": 14627,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497949.097, "dur": 2.414, "args": { "External id": 14628,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497955.878, "dur": 0.680, "args": { "External id": 14629,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "256"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497958.308, "dur": 0.642, "args": { "External id": 14630,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "524544"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497960.505, "dur": 0.813, "args": { "External id": 14631,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1048832"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497964.667, "dur": 0.603, "args": { "External id": 14632,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "1573120"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497966.737, "dur": 0.990, "args": { "External id": 14633,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "2097408"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497969.292, "dur": 2.733, "args": { "External id": 14634,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "2097664"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497973.645, "dur": 0.631, "args": { "External id": 14635,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "3539456"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650497975.590, "dur": 0.909, "args": { "External id": 14636,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "4981248"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650498035.679, "dur": 45.583, "args": { "External id": 14637,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8132 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::all_gather_copy_in", "pid": 1336754, "tid": 1336754, "ts": 1295650498116.723, "dur": 139.980, "args": { "External id": 14638,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "6423040", "8", "1", "15", ""], "Input type": ["TensorList", "ScalarList", "Scalar", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [], [], [], [], [], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [], [], [], [], [], []], "Ev Idx": 8133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650498128.281, "dur": 5.629, "args": { "External id": 14639,"Record function id": 0, "Concrete Inputs": ["[51384320]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::narrow", "pid": 1336754, "tid": 1336754, "ts": 1295650498139.042, "dur": 11.161, "args": { "External id": 14640,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "6423040"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650498143.635, "dur": 6.166, "args": { "External id": 14641,"Record function id": 0, "Concrete Inputs": ["", "0", "6423040", "12846080", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[51384320], [], [], [], []], "Ev Idx": 8136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498147.337, "dur": 1.244, "args": { "External id": 14642,"Record function id": 0, "Concrete Inputs": ["", "[6423040]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[51384320], [], [], []], "Ev Idx": 8137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes", "pid": 1336754, "tid": 1336754, "ts": 1295650498157.237, "dur": 33.362, "args": { "External id": 14643,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[6423040], [], []], "Ev Idx": 8138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498159.377, "dur": 2.776, "args": { "External id": 14644,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "6423040"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498164.006, "dur": 0.703, "args": { "External id": 14645,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6423296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498166.067, "dur": 1.105, "args": { "External id": 14646,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "6947584"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498170.540, "dur": 1.095, "args": { "External id": 14647,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7471872"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498173.063, "dur": 0.962, "args": { "External id": 14648,"Record function id": 0, "Concrete Inputs": ["", "[524288]", "[1]", "7996160"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498175.439, "dur": 0.880, "args": { "External id": 14649,"Record function id": 0, "Concrete Inputs": ["", "[256]", "[1]", "8520448"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498179.531, "dur": 0.937, "args": { "External id": 14650,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "8520704"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498181.663, "dur": 0.699, "args": { "External id": 14651,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "9962496"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650498183.737, "dur": 2.358, "args": { "External id": 14652,"Record function id": 0, "Concrete Inputs": ["", "[1441792]", "[1]", "11404288"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[6423040], [], [], []], "Ev Idx": 8147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650498206.787, "dur": 40.123, "args": { "External id": 14653,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["TensorList", "TensorList", "Scalar"], "Input Strides": [[[1], [1], [1], [1], [1], [1], [1], [1], [1]], [[1], [1], [1], [1], [1], [1], [1], [1], [1]], []], "Input Dims": [[[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], [[256], [524288], [524288], [524288], [524288], [256], [1441792], [1441792], [1441792]], []], "Ev Idx": 8148 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::_allgather_base_", "pid": 1336754, "tid": 1336754, "ts": 1295650498312.337, "dur": 348.448, "args": { "External id": 14654,"Record function id": 0, "Concrete Inputs": ["", "", "", "False", "-1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "Scalar", "Scalar"], "Input Strides": [[1], [1], [], [], []], "Input Dims": [[51384320], [6423040], [], [], []], "Ev Idx": 8149 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650498341.668, "dur": 314.901, "args": { "External id": 14655,"Record function id": 0, "Collective name": "_allgather_base", "Process Group Description": "default_pg", "dtype": "BFloat16", "Rank": 1, "Input Strides": [[1], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 51384320, "Process Group Name": "0", "Input type": ["c10::BFloat16", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[6423040], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 8150, "In msg nelems": 6423040 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:_all_gather_base", "pid": 1336754, "tid": 1336754, "ts": 1295650498351.871, "dur": 299.139, "args": { "External id": 14656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[1]], "Input Dims": [[6423040]], "Ev Idx": 8151 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295650498682.511, "dur": 2.221, "args": { "External id": 14657,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 8152, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::all_gather_copy_out (model.layers.27)", "pid": 1336754, "tid": 1336754, "ts": 1295650498769.564, "dur": 17125.476, "args": { "External id": 14658,"Record function id": 0, "Ev Idx": 8153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498879.276, "dur": 6.215, "args": { "External id": 14659,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[51384320], []], "Ev Idx": 8154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498889.154, "dur": 1.509, "args": { "External id": 14660,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498892.330, "dur": 1.169, "args": { "External id": 14661,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498897.606, "dur": 1.150, "args": { "External id": 14662,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498900.137, "dur": 1.301, "args": { "External id": 14663,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498902.674, "dur": 1.416, "args": { "External id": 14664,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[4194304], []], "Ev Idx": 8159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498906.027, "dur": 1.130, "args": { "External id": 14665,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[2048], []], "Ev Idx": 8160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498910.317, "dur": 2.239, "args": { "External id": 14666,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498914.096, "dur": 1.027, "args": { "External id": 14667,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650498916.417, "dur": 0.912, "args": { "External id": 14668,"Record function id": 0, "Concrete Inputs": ["", "[8, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[11534336], []], "Ev Idx": 8163 } }, { "ph": "X", "cat": "cpu_op", "name": "fsdp::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650498936.765, "dur": 16918.552, "args": { "External id": 14669,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::split_with_sizes_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650498952.372, "dur": 16895.961, "args": { "External id": 14670,"Record function id": 0, "Concrete Inputs": ["", "[256, 524288, 524288, 524288, 524288, 256, 1441792, 1441792, 1441792]", "1", ""], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "TensorList"], "Input Strides": [[6423040, 1], [], [], [[256, 1], [524288, 1], [524288, 1], [524288, 1], [524288, 1], [256, 1], [1441792, 1], [1441792, 1], [1441792, 1]]], "Input Dims": [[8, 6423040], [], [], [[8, 256], [8, 524288], [8, 524288], [8, 524288], [8, 524288], [8, 256], [8, 1441792], [8, 1441792], [8, 1441792]]], "Ev Idx": 8165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650498970.122, "dur": 52.657, "args": { "External id": 14671,"Record function id": 0, "Concrete Inputs": ["[2133]", "4", "", "", "True", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650499028.683, "dur": 16784.303, "args": { "External id": 14672,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", "False", ""], "Input type": ["long int", "", "", "", "", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], [], []], "Ev Idx": 8167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650499031.325, "dur": 16780.957, "args": { "External id": 14673,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "True", ""], "Input type": ["long int", "", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[2133], [], [], [], [], [], []], "Ev Idx": 8168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650499037.362, "dur": 7.096, "args": { "External id": 14674,"Record function id": 0, "Concrete Inputs": ["[2133]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650499046.006, "dur": 16763.122, "args": { "External id": 14675,"Record function id": 0, "Concrete Inputs": ["", "", "True"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[2133], [2133], []], "Ev Idx": 8170 } }, { "ph": "X", "cat": "cpu_op", "name": "RegisterPostBackwardFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650516055.265, "dur": 42.699, "args": { "External id": 14676,"Sequence number": 246595, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048]], "Ev Idx": 8171 } }, { "ph": "s", "id": 173, "pid": 1336754, "tid": 1336754, "ts": 1295650516055.265, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295650516084.105, "dur": 8.470, "args": { "External id": 14677,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1]], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048]], "Ev Idx": 8172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650516087.442, "dur": 4.769, "args": { "External id": 14678,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8173 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650516162.138, "dur": 89.434, "args": { "External id": 14679,"Record function id": 0, "Ev Idx": 8174 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 1/1", "pid": 1336754, "tid": 1336754, "ts": 1295650516254.544, "dur": 1118.084, "args": { "External id": 14680,"Record function id": 0, "Ev Idx": 8175 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650516295.096, "dur": 1064.066, "args": { "External id": 14681,"Sequence number": 246596, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "", "", "", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1], [2048, 1], [2048, 1], [2048, 1], [32, 1], [32, 1], [2048, 1], [1], [2048, 1], [2048, 1], [5632, 1]], "Input Dims": [[16, 4096, 2048], [2048], [2048, 2048], [2048, 2048], [2048, 2048], [8192, 32], [8192, 32], [2048, 2048], [2048], [5632, 2048], [5632, 2048], [2048, 5632]], "Ev Idx": 8176 } }, { "ph": "s", "id": 172, "pid": 1336754, "tid": 1336754, "ts": 1295650516295.096, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650516365.058, "dur": 46.822, "args": { "External id": 14682,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650516425.673, "dur": 106.900, "args": { "External id": 14683,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650516542.141, "dur": 43.629, "args": { "External id": 14684,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650516595.691, "dur": 31.558, "args": { "External id": 14685,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8180 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650516653.194, "dur": 29.304, "args": { "External id": 14686,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8181 } }, { "ph": "X", "cat": "cpu_op", "name": "rotary_embedding_kernel_1", "pid": 1336754, "tid": 1336754, "ts": 1295650516700.383, "dur": 16.073, "args": { "External id": 14687,"kernel_hash": "cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "0", "16", "4096", "32", "64", "32", "8192", "32", "64", "False", "False", "False", "False"], "kernel_file": "/tmp/torchinductor_cvm/vf/cvfmx3dtueggejegez27w222l5wve5udft5w5bpqit5metyl3lao.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 8182 } }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650516733.851, "dur": 131.838, "args": { "External id": 14688,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650516787.612, "dur": 12.227, "args": { "External id": 14689,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650516792.597, "dur": 6.456, "args": { "External id": 14690,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650516802.911, "dur": 5.393, "args": { "External id": 14691,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650516809.662, "dur": 1.685, "args": { "External id": 14692,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650516813.692, "dur": 2.875, "args": { "External id": 14693,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650516876.048, "dur": 47.215, "args": { "External id": 14694,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [2048, 1]], "Input Dims": [[65536, 2048], [2048, 2048], [65536, 2048]], "Ev Idx": 8189 } }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_2", "pid": 1336754, "tid": 1336754, "ts": 1295650516955.306, "dur": 65.379, "args": { "External id": 14695,"kernel_hash": "cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "True", "True", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/wx/cwxmlnjvnrmqdfwpkx5pm5ox5uexmxff6wgrjt6ou3pvccpt3bci.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [2048, 1], [2048, 1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536, 2048], [2048], [65536, 2048], [65536, 2048], [65536], [], [], [], [], [], [], [], [], []], "Ev Idx": 8190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650517034.307, "dur": 49.224, "args": { "External id": 14696,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650517093.304, "dur": 37.267, "args": { "External id": 14697,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048], [5632, 1]], "Input Dims": [[65536, 2048], [2048, 5632], [65536, 5632]], "Ev Idx": 8192 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused__to_copy_mul_silu_0", "pid": 1336754, "tid": 1336754, "ts": 1295650517157.180, "dur": 28.731, "args": { "External id": 14698,"kernel_hash": "c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43", "grid": "grid(369098752,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "369098752"], "kernel_file": "/tmp/torchinductor_cvm/2f/c2fsjwk3nwbfke7oj7nq5k7qop6mvatbrirsxktytkvp2mdmme43.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[5632, 1], [5632, 1], [23068672, 5632, 1], []], "Input Dims": [[65536, 5632], [65536, 5632], [16, 4096, 5632], []], "Ev Idx": 8193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650517191.742, "dur": 35.499, "args": { "External id": 14699,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632], [2048, 1]], "Input Dims": [[65536, 5632], [5632, 2048], [65536, 2048]], "Ev Idx": 8194 } }, { "ph": "X", "cat": "cpu_op", "name": "triton_poi_fused_add_1", "pid": 1336754, "tid": 1336754, "ts": 1295650517265.766, "dur": 21.918, "args": { "External id": 14700,"kernel_hash": "cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb", "grid": "grid(134217728,)", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "134217728"], "kernel_file": "/tmp/torchinductor_cvm/gi/cgik4ktlpri5iod5s5ynrzau3qlffebgfpe6sdr2lepxbydsdryb.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [65536, 2048], []], "Ev Idx": 8195 } }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward (model.layers.27)", "pid": 1336754, "tid": 1336754, "ts": 1295650517436.758, "dur": 33.822, "args": { "External id": 14701,"Record function id": 0, "Ev Idx": 8196 } }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650517610.676, "dur": 280.602, "args": { "External id": 14702,"Sequence number": 246597, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8197 } }, { "ph": "s", "id": 171, "pid": 1336754, "tid": 1336754, "ts": 1295650517610.676, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650517642.425, "dur": 8.640, "args": { "External id": 14703,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650517644.774, "dur": 6.017, "args": { "External id": 14704,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650517661.295, "dur": 13.230, "args": { "External id": 14705,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650517665.033, "dur": 8.883, "args": { "External id": 14706,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650517683.482, "dur": 5.553, "args": { "External id": 14707,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650517872.885, "dur": 6.165, "args": { "External id": 14708,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650517876.281, "dur": 2.555, "args": { "External id": 14709,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650517921.229, "dur": 179.166, "args": { "External id": 14710,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650517924.678, "dur": 15.879, "args": { "External id": 14711,"Sequence number": 246598, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8206 } }, { "ph": "s", "id": 170, "pid": 1336754, "tid": 1336754, "ts": 1295650517924.678, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650517930.057, "dur": 8.550, "args": { "External id": 14712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650517935.777, "dur": 2.479, "args": { "External id": 14713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650517943.428, "dur": 156.640, "args": { "External id": 14714,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650517945.986, "dur": 4.419, "args": { "External id": 14715,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650517946.801, "dur": 3.441, "args": { "External id": 14716,"Sequence number": 246599, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8211 } }, { "ph": "s", "id": 169, "pid": 1336754, "tid": 1336754, "ts": 1295650517946.801, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650517954.394, "dur": 135.121, "args": { "External id": 14717,"Sequence number": 246600, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8212 } }, { "ph": "s", "id": 168, "pid": 1336754, "tid": 1336754, "ts": 1295650517954.394, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650518094.058, "dur": 4.946, "args": { "External id": 14718,"Sequence number": 246601, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8213 } }, { "ph": "s", "id": 167, "pid": 1336754, "tid": 1336754, "ts": 1295650518094.058, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650518113.821, "dur": 75.249, "args": { "External id": 14719,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650518115.122, "dur": 9.459, "args": { "External id": 14720,"Sequence number": 246602, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8215 } }, { "ph": "s", "id": 166, "pid": 1336754, "tid": 1336754, "ts": 1295650518115.122, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650518117.599, "dur": 5.641, "args": { "External id": 14721,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518121.498, "dur": 1.393, "args": { "External id": 14722,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650518125.365, "dur": 63.413, "args": { "External id": 14723,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518126.744, "dur": 6.123, "args": { "External id": 14724,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518127.404, "dur": 5.280, "args": { "External id": 14725,"Sequence number": 246603, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8220 } }, { "ph": "s", "id": 165, "pid": 1336754, "tid": 1336754, "ts": 1295650518127.404, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650518133.572, "dur": 47.718, "args": { "External id": 14726,"Sequence number": 246604, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8221 } }, { "ph": "s", "id": 164, "pid": 1336754, "tid": 1336754, "ts": 1295650518133.572, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650518183.266, "dur": 5.135, "args": { "External id": 14727,"Sequence number": 246605, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8222 } }, { "ph": "s", "id": 163, "pid": 1336754, "tid": 1336754, "ts": 1295650518183.266, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650518197.445, "dur": 102.848, "args": { "External id": 14728,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650518198.302, "dur": 6.269, "args": { "External id": 14729,"Sequence number": 246606, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8224 } }, { "ph": "s", "id": 162, "pid": 1336754, "tid": 1336754, "ts": 1295650518198.302, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650518200.622, "dur": 2.623, "args": { "External id": 14730,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518202.048, "dur": 0.913, "args": { "External id": 14731,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650518207.332, "dur": 92.642, "args": { "External id": 14732,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518208.533, "dur": 5.528, "args": { "External id": 14733,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518209.613, "dur": 4.308, "args": { "External id": 14734,"Sequence number": 246607, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8229 } }, { "ph": "s", "id": 161, "pid": 1336754, "tid": 1336754, "ts": 1295650518209.613, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650518214.561, "dur": 74.399, "args": { "External id": 14735,"Sequence number": 246608, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8230 } }, { "ph": "s", "id": 160, "pid": 1336754, "tid": 1336754, "ts": 1295650518214.561, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650518292.122, "dur": 7.353, "args": { "External id": 14736,"Sequence number": 246609, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8231 } }, { "ph": "s", "id": 159, "pid": 1336754, "tid": 1336754, "ts": 1295650518292.122, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518324.236, "dur": 5.155, "args": { "External id": 14737,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518325.896, "dur": 3.365, "args": { "External id": 14738,"Sequence number": 246610, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8233 } }, { "ph": "s", "id": 158, "pid": 1336754, "tid": 1336754, "ts": 1295650518325.896, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518336.075, "dur": 3.696, "args": { "External id": 14739,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518337.477, "dur": 2.163, "args": { "External id": 14740,"Sequence number": 246611, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8235 } }, { "ph": "s", "id": 157, "pid": 1336754, "tid": 1336754, "ts": 1295650518337.477, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518346.202, "dur": 6.023, "args": { "External id": 14741,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518347.637, "dur": 4.455, "args": { "External id": 14742,"Sequence number": 246612, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8237 } }, { "ph": "s", "id": 156, "pid": 1336754, "tid": 1336754, "ts": 1295650518347.637, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650518392.192, "dur": 190.417, "args": { "External id": 14743,"Sequence number": 246613, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8238 } }, { "ph": "s", "id": 155, "pid": 1336754, "tid": 1336754, "ts": 1295650518392.192, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650518416.959, "dur": 10.548, "args": { "External id": 14744,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518420.330, "dur": 6.740, "args": { "External id": 14745,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8240 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650518594.867, "dur": 112.181, "args": { "External id": 14746,"Sequence number": 246614, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8241 } }, { "ph": "s", "id": 154, "pid": 1336754, "tid": 1336754, "ts": 1295650518594.867, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650518610.255, "dur": 7.133, "args": { "External id": 14747,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518612.760, "dur": 4.303, "args": { "External id": 14748,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8243 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336754, "tid": 1336754, "ts": 1295650518736.271, "dur": 193.920, "args": { "External id": 14749,"Sequence number": 246615, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8244 } }, { "ph": "s", "id": 153, "pid": 1336754, "tid": 1336754, "ts": 1295650518736.271, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650518766.002, "dur": 133.886, "args": { "External id": 14750,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650518819.267, "dur": 7.211, "args": { "External id": 14751,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518821.962, "dur": 4.096, "args": { "External id": 14752,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650518829.043, "dur": 4.808, "args": { "External id": 14753,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650518835.267, "dur": 1.801, "args": { "External id": 14754,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650518841.840, "dur": 3.157, "args": { "External id": 14755,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1336754, "ts": 1295650518915.444, "dur": 5.425, "args": { "External id": 14756,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518935.433, "dur": 5.573, "args": { "External id": 14757,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518936.958, "dur": 3.869, "args": { "External id": 14758,"Sequence number": 246616, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8253 } }, { "ph": "s", "id": 152, "pid": 1336754, "tid": 1336754, "ts": 1295650518936.958, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650518957.815, "dur": 175.872, "args": { "External id": 14759,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650518961.043, "dur": 9.126, "args": { "External id": 14760,"Sequence number": 246617, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8255 } }, { "ph": "s", "id": 151, "pid": 1336754, "tid": 1336754, "ts": 1295650518961.043, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650518964.232, "dur": 5.044, "args": { "External id": 14761,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650518967.177, "dur": 1.729, "args": { "External id": 14762,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650518971.519, "dur": 161.802, "args": { "External id": 14763,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650518973.896, "dur": 60.255, "args": { "External id": 14764,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650518977.097, "dur": 56.569, "args": { "External id": 14765,"Sequence number": 246618, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8260 } }, { "ph": "s", "id": 150, "pid": 1336754, "tid": 1336754, "ts": 1295650518977.097, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650519036.255, "dur": 87.205, "args": { "External id": 14766,"Sequence number": 246619, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8261 } }, { "ph": "s", "id": 149, "pid": 1336754, "tid": 1336754, "ts": 1295650519036.255, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650519125.936, "dur": 6.469, "args": { "External id": 14767,"Sequence number": 246620, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8262 } }, { "ph": "s", "id": 148, "pid": 1336754, "tid": 1336754, "ts": 1295650519125.936, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650519172.985, "dur": 259.225, "args": { "External id": 14768,"Sequence number": 246621, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8263 } }, { "ph": "s", "id": 147, "pid": 1336754, "tid": 1336754, "ts": 1295650519172.985, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519195.463, "dur": 3.573, "args": { "External id": 14769,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519196.704, "dur": 2.187, "args": { "External id": 14770,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336754, "tid": 1336754, "ts": 1295650519203.733, "dur": 3.347, "args": { "External id": 14771,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519204.973, "dur": 1.986, "args": { "External id": 14772,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519205.602, "dur": 1.224, "args": { "External id": 14773,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650519215.329, "dur": 10.314, "args": { "External id": 14774,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650519219.454, "dur": 5.917, "args": { "External id": 14775,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650519248.583, "dur": 4.804, "args": { "External id": 14776,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650519257.439, "dur": 3.448, "args": { "External id": 14777,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519405.540, "dur": 3.839, "args": { "External id": 14778,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519406.731, "dur": 2.428, "args": { "External id": 14779,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519412.207, "dur": 2.778, "args": { "External id": 14780,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519413.548, "dur": 1.320, "args": { "External id": 14781,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650519455.638, "dur": 107.491, "args": { "External id": 14782,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650519457.149, "dur": 8.800, "args": { "External id": 14783,"Sequence number": 246622, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8278 } }, { "ph": "s", "id": 146, "pid": 1336754, "tid": 1336754, "ts": 1295650519457.149, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650519460.401, "dur": 4.369, "args": { "External id": 14784,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650519462.839, "dur": 1.614, "args": { "External id": 14785,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650519467.189, "dur": 95.627, "args": { "External id": 14786,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519470.914, "dur": 4.534, "args": { "External id": 14787,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519471.979, "dur": 3.328, "args": { "External id": 14788,"Sequence number": 246623, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8283 } }, { "ph": "s", "id": 145, "pid": 1336754, "tid": 1336754, "ts": 1295650519471.979, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650519476.211, "dur": 80.246, "args": { "External id": 14789,"Sequence number": 246624, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8284 } }, { "ph": "s", "id": 144, "pid": 1336754, "tid": 1336754, "ts": 1295650519476.211, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650519558.531, "dur": 3.624, "args": { "External id": 14790,"Sequence number": 246625, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8285 } }, { "ph": "s", "id": 143, "pid": 1336754, "tid": 1336754, "ts": 1295650519558.531, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650519572.228, "dur": 77.250, "args": { "External id": 14791,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650519574.946, "dur": 7.191, "args": { "External id": 14792,"Sequence number": 246626, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8287 } }, { "ph": "s", "id": 142, "pid": 1336754, "tid": 1336754, "ts": 1295650519574.946, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650519577.471, "dur": 3.255, "args": { "External id": 14793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650519579.457, "dur": 1.125, "args": { "External id": 14794,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650519582.946, "dur": 66.272, "args": { "External id": 14795,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519583.782, "dur": 8.906, "args": { "External id": 14796,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519586.630, "dur": 5.881, "args": { "External id": 14797,"Sequence number": 246627, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8292 } }, { "ph": "s", "id": 141, "pid": 1336754, "tid": 1336754, "ts": 1295650519586.630, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650519593.369, "dur": 48.117, "args": { "External id": 14798,"Sequence number": 246628, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8293 } }, { "ph": "s", "id": 140, "pid": 1336754, "tid": 1336754, "ts": 1295650519593.369, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650519643.179, "dur": 5.687, "args": { "External id": 14799,"Sequence number": 246629, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8294 } }, { "ph": "s", "id": 139, "pid": 1336754, "tid": 1336754, "ts": 1295650519643.179, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650519672.828, "dur": 158.996, "args": { "External id": 14800,"Sequence number": 246630, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8295 } }, { "ph": "s", "id": 138, "pid": 1336754, "tid": 1336754, "ts": 1295650519672.828, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650519717.577, "dur": 4.644, "args": { "External id": 14801,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650519757.359, "dur": 60.280, "args": { "External id": 14802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650519758.302, "dur": 4.766, "args": { "External id": 14803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650519759.320, "dur": 2.905, "args": { "External id": 14804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650519761.065, "dur": 0.943, "args": { "External id": 14805,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650519763.938, "dur": 53.439, "args": { "External id": 14806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519767.805, "dur": 2.160, "args": { "External id": 14807,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519768.338, "dur": 1.475, "args": { "External id": 14808,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650519770.885, "dur": 42.752, "args": { "External id": 14809,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650519815.565, "dur": 1.184, "args": { "External id": 14810,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295650519841.492, "dur": 29.779, "args": { "External id": 14811,"Sequence number": 246631, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8306 } }, { "ph": "s", "id": 137, "pid": 1336754, "tid": 1336754, "ts": 1295650519841.492, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650519905.749, "dur": 235.457, "args": { "External id": 14812,"Sequence number": 246632, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8307 } }, { "ph": "s", "id": 136, "pid": 1336754, "tid": 1336754, "ts": 1295650519905.749, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650519927.585, "dur": 5.443, "args": { "External id": 14813,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650519930.869, "dur": 1.881, "args": { "External id": 14814,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650519940.670, "dur": 8.466, "args": { "External id": 14815,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650519943.403, "dur": 5.413, "args": { "External id": 14816,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650519954.572, "dur": 3.691, "args": { "External id": 14817,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520122.134, "dur": 4.348, "args": { "External id": 14818,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520123.234, "dur": 2.924, "args": { "External id": 14819,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650520161.963, "dur": 116.679, "args": { "External id": 14820,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650520163.093, "dur": 9.862, "args": { "External id": 14821,"Sequence number": 246633, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8316 } }, { "ph": "s", "id": 135, "pid": 1336754, "tid": 1336754, "ts": 1295650520163.093, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650520167.856, "dur": 3.814, "args": { "External id": 14822,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520169.896, "dur": 1.494, "args": { "External id": 14823,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650520174.299, "dur": 104.101, "args": { "External id": 14824,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520176.122, "dur": 6.447, "args": { "External id": 14825,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520179.533, "dur": 2.902, "args": { "External id": 14826,"Sequence number": 246634, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8321 } }, { "ph": "s", "id": 134, "pid": 1336754, "tid": 1336754, "ts": 1295650520179.533, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650520183.470, "dur": 87.339, "args": { "External id": 14827,"Sequence number": 246635, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8322 } }, { "ph": "s", "id": 133, "pid": 1336754, "tid": 1336754, "ts": 1295650520183.470, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650520274.023, "dur": 3.479, "args": { "External id": 14828,"Sequence number": 246636, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8323 } }, { "ph": "s", "id": 132, "pid": 1336754, "tid": 1336754, "ts": 1295650520274.023, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650520288.643, "dur": 77.066, "args": { "External id": 14829,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650520289.570, "dur": 12.218, "args": { "External id": 14830,"Sequence number": 246637, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8325 } }, { "ph": "s", "id": 131, "pid": 1336754, "tid": 1336754, "ts": 1295650520289.570, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650520297.603, "dur": 3.088, "args": { "External id": 14831,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520299.607, "dur": 0.910, "args": { "External id": 14832,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650520302.653, "dur": 62.873, "args": { "External id": 14833,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520304.272, "dur": 5.213, "args": { "External id": 14834,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520305.235, "dur": 4.110, "args": { "External id": 14835,"Sequence number": 246638, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8330 } }, { "ph": "s", "id": 130, "pid": 1336754, "tid": 1336754, "ts": 1295650520305.235, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650520310.007, "dur": 50.925, "args": { "External id": 14836,"Sequence number": 246639, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8331 } }, { "ph": "s", "id": 129, "pid": 1336754, "tid": 1336754, "ts": 1295650520310.007, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650520362.637, "dur": 2.563, "args": { "External id": 14837,"Sequence number": 246640, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8332 } }, { "ph": "s", "id": 128, "pid": 1336754, "tid": 1336754, "ts": 1295650520362.637, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650520373.890, "dur": 66.005, "args": { "External id": 14838,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650520374.450, "dur": 11.093, "args": { "External id": 14839,"Sequence number": 246641, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8334 } }, { "ph": "s", "id": 127, "pid": 1336754, "tid": 1336754, "ts": 1295650520374.450, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650520377.067, "dur": 7.185, "args": { "External id": 14840,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520380.717, "dur": 3.320, "args": { "External id": 14841,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650520386.272, "dur": 53.435, "args": { "External id": 14842,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520387.202, "dur": 4.507, "args": { "External id": 14843,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520388.112, "dur": 3.465, "args": { "External id": 14844,"Sequence number": 246642, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8339 } }, { "ph": "s", "id": 126, "pid": 1336754, "tid": 1336754, "ts": 1295650520388.112, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650520394.068, "dur": 38.148, "args": { "External id": 14845,"Sequence number": 246643, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8340 } }, { "ph": "s", "id": 125, "pid": 1336754, "tid": 1336754, "ts": 1295650520394.068, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650520434.228, "dur": 5.152, "args": { "External id": 14846,"Sequence number": 246644, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8341 } }, { "ph": "s", "id": 124, "pid": 1336754, "tid": 1336754, "ts": 1295650520434.228, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520456.001, "dur": 5.357, "args": { "External id": 14847,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520457.417, "dur": 3.805, "args": { "External id": 14848,"Sequence number": 246645, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8343 } }, { "ph": "s", "id": 123, "pid": 1336754, "tid": 1336754, "ts": 1295650520457.417, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520494.421, "dur": 8.176, "args": { "External id": 14849,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520498.019, "dur": 4.462, "args": { "External id": 14850,"Sequence number": 246646, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8345 } }, { "ph": "s", "id": 122, "pid": 1336754, "tid": 1336754, "ts": 1295650520498.019, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650520506.690, "dur": 5.006, "args": { "External id": 14851,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650520507.652, "dur": 3.898, "args": { "External id": 14852,"Sequence number": 246647, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8347 } }, { "ph": "s", "id": 121, "pid": 1336754, "tid": 1336754, "ts": 1295650520507.652, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650520544.054, "dur": 159.996, "args": { "External id": 14853,"Sequence number": 246648, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8348 } }, { "ph": "s", "id": 120, "pid": 1336754, "tid": 1336754, "ts": 1295650520544.054, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650520564.389, "dur": 9.482, "args": { "External id": 14854,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520567.460, "dur": 6.026, "args": { "External id": 14855,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8350 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650520718.285, "dur": 101.755, "args": { "External id": 14856,"Sequence number": 246649, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8351 } }, { "ph": "s", "id": 119, "pid": 1336754, "tid": 1336754, "ts": 1295650520718.285, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650520732.857, "dur": 6.962, "args": { "External id": 14857,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520734.985, "dur": 4.349, "args": { "External id": 14858,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8353 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336754, "tid": 1336754, "ts": 1295650520846.901, "dur": 224.160, "args": { "External id": 14859,"Sequence number": 246650, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8354 } }, { "ph": "s", "id": 118, "pid": 1336754, "tid": 1336754, "ts": 1295650520846.901, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650520876.149, "dur": 165.366, "args": { "External id": 14860,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650520925.398, "dur": 7.559, "args": { "External id": 14861,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650520927.637, "dur": 4.609, "args": { "External id": 14862,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650520935.656, "dur": 4.109, "args": { "External id": 14863,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650520941.209, "dur": 3.965, "args": { "External id": 14864,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650520947.485, "dur": 3.576, "args": { "External id": 14865,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1336754, "ts": 1295650521054.967, "dur": 5.204, "args": { "External id": 14866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521076.595, "dur": 7.376, "args": { "External id": 14867,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521077.578, "dur": 6.206, "args": { "External id": 14868,"Sequence number": 246651, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8363 } }, { "ph": "s", "id": 117, "pid": 1336754, "tid": 1336754, "ts": 1295650521077.578, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650521101.083, "dur": 113.762, "args": { "External id": 14869,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650521102.407, "dur": 8.520, "args": { "External id": 14870,"Sequence number": 246652, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8365 } }, { "ph": "s", "id": 116, "pid": 1336754, "tid": 1336754, "ts": 1295650521102.407, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650521105.590, "dur": 4.322, "args": { "External id": 14871,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521107.934, "dur": 1.719, "args": { "External id": 14872,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650521112.122, "dur": 102.397, "args": { "External id": 14873,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521116.707, "dur": 5.241, "args": { "External id": 14874,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521117.157, "dur": 4.660, "args": { "External id": 14875,"Sequence number": 246653, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8370 } }, { "ph": "s", "id": 115, "pid": 1336754, "tid": 1336754, "ts": 1295650521117.157, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650521122.908, "dur": 83.127, "args": { "External id": 14876,"Sequence number": 246654, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8371 } }, { "ph": "s", "id": 114, "pid": 1336754, "tid": 1336754, "ts": 1295650521122.908, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650521208.199, "dur": 5.631, "args": { "External id": 14877,"Sequence number": 246655, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8372 } }, { "ph": "s", "id": 113, "pid": 1336754, "tid": 1336754, "ts": 1295650521208.199, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650521264.700, "dur": 215.862, "args": { "External id": 14878,"Sequence number": 246656, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8373 } }, { "ph": "s", "id": 112, "pid": 1336754, "tid": 1336754, "ts": 1295650521264.700, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521288.082, "dur": 2.776, "args": { "External id": 14879,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521288.651, "dur": 1.936, "args": { "External id": 14880,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336754, "tid": 1336754, "ts": 1295650521294.836, "dur": 5.639, "args": { "External id": 14881,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521295.565, "dur": 4.809, "args": { "External id": 14882,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521299.109, "dur": 1.142, "args": { "External id": 14883,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650521307.605, "dur": 7.752, "args": { "External id": 14884,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521309.706, "dur": 5.365, "args": { "External id": 14885,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650521321.464, "dur": 4.274, "args": { "External id": 14886,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650521329.357, "dur": 3.464, "args": { "External id": 14887,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521456.066, "dur": 3.140, "args": { "External id": 14888,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521457.263, "dur": 1.771, "args": { "External id": 14889,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521463.791, "dur": 2.778, "args": { "External id": 14890,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521465.179, "dur": 1.269, "args": { "External id": 14891,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650521499.034, "dur": 96.925, "args": { "External id": 14892,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650521500.219, "dur": 7.298, "args": { "External id": 14893,"Sequence number": 246657, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8388 } }, { "ph": "s", "id": 111, "pid": 1336754, "tid": 1336754, "ts": 1295650521500.219, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650521502.620, "dur": 3.859, "args": { "External id": 14894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521504.504, "dur": 1.671, "args": { "External id": 14895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650521510.445, "dur": 85.138, "args": { "External id": 14896,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521512.566, "dur": 2.861, "args": { "External id": 14897,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521513.031, "dur": 2.269, "args": { "External id": 14898,"Sequence number": 246658, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8393 } }, { "ph": "s", "id": 110, "pid": 1336754, "tid": 1336754, "ts": 1295650521513.031, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650521516.032, "dur": 72.471, "args": { "External id": 14899,"Sequence number": 246659, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8394 } }, { "ph": "s", "id": 109, "pid": 1336754, "tid": 1336754, "ts": 1295650521516.032, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650521590.646, "dur": 4.376, "args": { "External id": 14900,"Sequence number": 246660, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8395 } }, { "ph": "s", "id": 108, "pid": 1336754, "tid": 1336754, "ts": 1295650521590.646, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650521603.766, "dur": 68.791, "args": { "External id": 14901,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650521604.292, "dur": 5.596, "args": { "External id": 14902,"Sequence number": 246661, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8397 } }, { "ph": "s", "id": 107, "pid": 1336754, "tid": 1336754, "ts": 1295650521604.292, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650521606.552, "dur": 2.246, "args": { "External id": 14903,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521607.681, "dur": 0.942, "args": { "External id": 14904,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650521610.442, "dur": 61.806, "args": { "External id": 14905,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521613.339, "dur": 7.268, "args": { "External id": 14906,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521614.255, "dur": 6.185, "args": { "External id": 14907,"Sequence number": 246662, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8402 } }, { "ph": "s", "id": 106, "pid": 1336754, "tid": 1336754, "ts": 1295650521614.255, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650521621.340, "dur": 44.338, "args": { "External id": 14908,"Sequence number": 246663, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8403 } }, { "ph": "s", "id": 105, "pid": 1336754, "tid": 1336754, "ts": 1295650521621.340, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650521667.219, "dur": 4.708, "args": { "External id": 14909,"Sequence number": 246664, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8404 } }, { "ph": "s", "id": 104, "pid": 1336754, "tid": 1336754, "ts": 1295650521667.219, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650521695.437, "dur": 142.065, "args": { "External id": 14910,"Sequence number": 246665, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8405 } }, { "ph": "s", "id": 103, "pid": 1336754, "tid": 1336754, "ts": 1295650521695.437, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650521732.172, "dur": 4.062, "args": { "External id": 14911,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650521769.499, "dur": 55.697, "args": { "External id": 14912,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650521770.401, "dur": 4.417, "args": { "External id": 14913,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650521771.436, "dur": 2.663, "args": { "External id": 14914,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521773.012, "dur": 0.892, "args": { "External id": 14915,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650521777.481, "dur": 47.409, "args": { "External id": 14916,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521778.620, "dur": 1.785, "args": { "External id": 14917,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521779.092, "dur": 1.182, "args": { "External id": 14918,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650521781.098, "dur": 39.981, "args": { "External id": 14919,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650521822.958, "dur": 1.352, "args": { "External id": 14920,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295650521845.996, "dur": 25.911, "args": { "External id": 14921,"Sequence number": 246666, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8416 } }, { "ph": "s", "id": 102, "pid": 1336754, "tid": 1336754, "ts": 1295650521845.996, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650521904.588, "dur": 216.204, "args": { "External id": 14922,"Sequence number": 246667, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8417 } }, { "ph": "s", "id": 101, "pid": 1336754, "tid": 1336754, "ts": 1295650521904.588, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650521924.269, "dur": 2.907, "args": { "External id": 14923,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650521925.272, "dur": 1.767, "args": { "External id": 14924,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650521934.765, "dur": 6.444, "args": { "External id": 14925,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650521936.839, "dur": 3.983, "args": { "External id": 14926,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650521946.272, "dur": 3.323, "args": { "External id": 14927,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522101.146, "dur": 4.155, "args": { "External id": 14928,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522102.327, "dur": 2.607, "args": { "External id": 14929,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650522141.377, "dur": 115.854, "args": { "External id": 14930,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650522142.765, "dur": 7.644, "args": { "External id": 14931,"Sequence number": 246668, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8426 } }, { "ph": "s", "id": 100, "pid": 1336754, "tid": 1336754, "ts": 1295650522142.765, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650522145.067, "dur": 3.825, "args": { "External id": 14932,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522146.945, "dur": 1.655, "args": { "External id": 14933,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650522151.507, "dur": 105.317, "args": { "External id": 14934,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522155.280, "dur": 3.536, "args": { "External id": 14935,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522155.971, "dur": 2.720, "args": { "External id": 14936,"Sequence number": 246669, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8431 } }, { "ph": "s", "id": 99, "pid": 1336754, "tid": 1336754, "ts": 1295650522155.971, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650522159.407, "dur": 86.772, "args": { "External id": 14937,"Sequence number": 246670, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8432 } }, { "ph": "s", "id": 98, "pid": 1336754, "tid": 1336754, "ts": 1295650522159.407, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650522249.772, "dur": 6.255, "args": { "External id": 14938,"Sequence number": 246671, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8433 } }, { "ph": "s", "id": 97, "pid": 1336754, "tid": 1336754, "ts": 1295650522249.772, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650522267.153, "dur": 68.434, "args": { "External id": 14939,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650522270.015, "dur": 5.425, "args": { "External id": 14940,"Sequence number": 246672, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8435 } }, { "ph": "s", "id": 96, "pid": 1336754, "tid": 1336754, "ts": 1295650522270.015, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650522271.877, "dur": 2.534, "args": { "External id": 14941,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522273.171, "dur": 1.101, "args": { "External id": 14942,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650522276.249, "dur": 59.084, "args": { "External id": 14943,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522277.230, "dur": 5.453, "args": { "External id": 14944,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522280.082, "dur": 2.458, "args": { "External id": 14945,"Sequence number": 246673, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8440 } }, { "ph": "s", "id": 95, "pid": 1336754, "tid": 1336754, "ts": 1295650522280.082, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650522283.197, "dur": 47.449, "args": { "External id": 14946,"Sequence number": 246674, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8441 } }, { "ph": "s", "id": 94, "pid": 1336754, "tid": 1336754, "ts": 1295650522283.197, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650522332.290, "dur": 2.689, "args": { "External id": 14947,"Sequence number": 246675, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8442 } }, { "ph": "s", "id": 93, "pid": 1336754, "tid": 1336754, "ts": 1295650522332.290, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650522342.604, "dur": 61.814, "args": { "External id": 14948,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650522343.373, "dur": 9.129, "args": { "External id": 14949,"Sequence number": 246676, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8444 } }, { "ph": "s", "id": 92, "pid": 1336754, "tid": 1336754, "ts": 1295650522343.373, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650522346.374, "dur": 5.146, "args": { "External id": 14950,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522347.846, "dur": 3.480, "args": { "External id": 14951,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650522353.194, "dur": 51.015, "args": { "External id": 14952,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522353.932, "dur": 6.293, "args": { "External id": 14953,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522357.086, "dur": 2.998, "args": { "External id": 14954,"Sequence number": 246677, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8449 } }, { "ph": "s", "id": 91, "pid": 1336754, "tid": 1336754, "ts": 1295650522357.086, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650522360.812, "dur": 37.667, "args": { "External id": 14955,"Sequence number": 246678, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8450 } }, { "ph": "s", "id": 90, "pid": 1336754, "tid": 1336754, "ts": 1295650522360.812, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650522399.998, "dur": 3.925, "args": { "External id": 14956,"Sequence number": 246679, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8451 } }, { "ph": "s", "id": 89, "pid": 1336754, "tid": 1336754, "ts": 1295650522399.998, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522419.654, "dur": 5.771, "args": { "External id": 14957,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522420.387, "dur": 4.894, "args": { "External id": 14958,"Sequence number": 246680, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8453 } }, { "ph": "s", "id": 88, "pid": 1336754, "tid": 1336754, "ts": 1295650522420.387, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522431.804, "dur": 3.405, "args": { "External id": 14959,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522433.030, "dur": 2.052, "args": { "External id": 14960,"Sequence number": 246681, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8455 } }, { "ph": "s", "id": 87, "pid": 1336754, "tid": 1336754, "ts": 1295650522433.030, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522439.188, "dur": 3.311, "args": { "External id": 14961,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522440.145, "dur": 2.223, "args": { "External id": 14962,"Sequence number": 246682, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8457 } }, { "ph": "s", "id": 86, "pid": 1336754, "tid": 1336754, "ts": 1295650522440.145, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650522472.936, "dur": 162.341, "args": { "External id": 14963,"Sequence number": 246683, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8458 } }, { "ph": "s", "id": 85, "pid": 1336754, "tid": 1336754, "ts": 1295650522472.936, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650522495.602, "dur": 10.715, "args": { "External id": 14964,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522498.817, "dur": 6.909, "args": { "External id": 14965,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8460 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650522647.276, "dur": 109.891, "args": { "External id": 14966,"Sequence number": 246684, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8461 } }, { "ph": "s", "id": 84, "pid": 1336754, "tid": 1336754, "ts": 1295650522647.276, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650522661.333, "dur": 6.952, "args": { "External id": 14967,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522663.679, "dur": 4.292, "args": { "External id": 14968,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8463 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336754, "tid": 1336754, "ts": 1295650522786.169, "dur": 172.863, "args": { "External id": 14969,"Sequence number": 246685, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8464 } }, { "ph": "s", "id": 83, "pid": 1336754, "tid": 1336754, "ts": 1295650522786.169, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650522812.306, "dur": 122.143, "args": { "External id": 14970,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650522859.083, "dur": 6.619, "args": { "External id": 14971,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650522861.168, "dur": 4.095, "args": { "External id": 14972,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650522868.170, "dur": 3.713, "args": { "External id": 14973,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650522873.339, "dur": 1.424, "args": { "External id": 14974,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650522877.395, "dur": 3.273, "args": { "External id": 14975,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1336754, "ts": 1295650522945.937, "dur": 3.916, "args": { "External id": 14976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650522964.080, "dur": 4.685, "args": { "External id": 14977,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650522965.084, "dur": 3.500, "args": { "External id": 14978,"Sequence number": 246686, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8473 } }, { "ph": "s", "id": 82, "pid": 1336754, "tid": 1336754, "ts": 1295650522965.084, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650522979.390, "dur": 160.650, "args": { "External id": 14979,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650522980.833, "dur": 54.180, "args": { "External id": 14980,"Sequence number": 246687, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8475 } }, { "ph": "s", "id": 81, "pid": 1336754, "tid": 1336754, "ts": 1295650522980.833, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650523026.897, "dur": 6.595, "args": { "External id": 14981,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523031.342, "dur": 1.663, "args": { "External id": 14982,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650523036.380, "dur": 103.274, "args": { "External id": 14983,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523038.376, "dur": 3.873, "args": { "External id": 14984,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523039.061, "dur": 3.079, "args": { "External id": 14985,"Sequence number": 246688, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8480 } }, { "ph": "s", "id": 80, "pid": 1336754, "tid": 1336754, "ts": 1295650523039.061, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650523043.138, "dur": 87.941, "args": { "External id": 14986,"Sequence number": 246689, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8481 } }, { "ph": "s", "id": 79, "pid": 1336754, "tid": 1336754, "ts": 1295650523043.138, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650523133.195, "dur": 5.712, "args": { "External id": 14987,"Sequence number": 246690, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8482 } }, { "ph": "s", "id": 78, "pid": 1336754, "tid": 1336754, "ts": 1295650523133.195, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650523177.259, "dur": 233.509, "args": { "External id": 14988,"Sequence number": 246691, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8483 } }, { "ph": "s", "id": 77, "pid": 1336754, "tid": 1336754, "ts": 1295650523177.259, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523195.911, "dur": 2.756, "args": { "External id": 14989,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523196.745, "dur": 1.755, "args": { "External id": 14990,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336754, "tid": 1336754, "ts": 1295650523202.674, "dur": 5.112, "args": { "External id": 14991,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523205.628, "dur": 2.036, "args": { "External id": 14992,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523206.568, "dur": 0.972, "args": { "External id": 14993,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650523215.184, "dur": 7.650, "args": { "External id": 14994,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523217.626, "dur": 4.912, "args": { "External id": 14995,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650523243.891, "dur": 4.510, "args": { "External id": 14996,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650523253.108, "dur": 4.058, "args": { "External id": 14997,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523387.092, "dur": 3.853, "args": { "External id": 14998,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523388.220, "dur": 2.547, "args": { "External id": 14999,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523393.648, "dur": 2.092, "args": { "External id": 15000,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523394.683, "dur": 0.937, "args": { "External id": 15001,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650523429.284, "dur": 111.373, "args": { "External id": 15002,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650523438.138, "dur": 9.292, "args": { "External id": 15003,"Sequence number": 246692, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8498 } }, { "ph": "s", "id": 76, "pid": 1336754, "tid": 1336754, "ts": 1295650523438.138, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650523443.037, "dur": 3.260, "args": { "External id": 15004,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523444.647, "dur": 1.422, "args": { "External id": 15005,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650523448.439, "dur": 91.703, "args": { "External id": 15006,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523449.884, "dur": 7.521, "args": { "External id": 15007,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523450.570, "dur": 6.649, "args": { "External id": 15008,"Sequence number": 246693, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8503 } }, { "ph": "s", "id": 75, "pid": 1336754, "tid": 1336754, "ts": 1295650523450.570, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650523458.331, "dur": 70.963, "args": { "External id": 15009,"Sequence number": 246694, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8504 } }, { "ph": "s", "id": 74, "pid": 1336754, "tid": 1336754, "ts": 1295650523458.331, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650523531.489, "dur": 7.900, "args": { "External id": 15010,"Sequence number": 246695, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8505 } }, { "ph": "s", "id": 73, "pid": 1336754, "tid": 1336754, "ts": 1295650523531.489, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650523548.938, "dur": 71.590, "args": { "External id": 15011,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650523549.472, "dur": 7.794, "args": { "External id": 15012,"Sequence number": 246696, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8507 } }, { "ph": "s", "id": 72, "pid": 1336754, "tid": 1336754, "ts": 1295650523549.472, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650523551.400, "dur": 4.688, "args": { "External id": 15013,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523554.701, "dur": 1.239, "args": { "External id": 15014,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650523557.977, "dur": 62.270, "args": { "External id": 15015,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523559.079, "dur": 4.798, "args": { "External id": 15016,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523560.110, "dur": 3.574, "args": { "External id": 15017,"Sequence number": 246697, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8512 } }, { "ph": "s", "id": 71, "pid": 1336754, "tid": 1336754, "ts": 1295650523560.110, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650523566.428, "dur": 48.539, "args": { "External id": 15018,"Sequence number": 246698, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8513 } }, { "ph": "s", "id": 70, "pid": 1336754, "tid": 1336754, "ts": 1295650523566.428, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650523616.795, "dur": 3.150, "args": { "External id": 15019,"Sequence number": 246699, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8514 } }, { "ph": "s", "id": 69, "pid": 1336754, "tid": 1336754, "ts": 1295650523616.795, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650523639.612, "dur": 165.116, "args": { "External id": 15020,"Sequence number": 246700, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8515 } }, { "ph": "s", "id": 68, "pid": 1336754, "tid": 1336754, "ts": 1295650523639.612, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650523674.604, "dur": 4.865, "args": { "External id": 15021,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650523713.835, "dur": 78.104, "args": { "External id": 15022,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650523714.489, "dur": 4.352, "args": { "External id": 15023,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650523715.631, "dur": 2.485, "args": { "External id": 15024,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523717.205, "dur": 0.738, "args": { "External id": 15025,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650523719.548, "dur": 72.134, "args": { "External id": 15026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523721.108, "dur": 1.823, "args": { "External id": 15027,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523721.550, "dur": 1.248, "args": { "External id": 15028,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650523725.471, "dur": 62.624, "args": { "External id": 15029,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650523789.904, "dur": 1.180, "args": { "External id": 15030,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295650523812.416, "dur": 25.784, "args": { "External id": 15031,"Sequence number": 246701, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8526 } }, { "ph": "s", "id": 67, "pid": 1336754, "tid": 1336754, "ts": 1295650523812.416, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650523870.987, "dur": 229.933, "args": { "External id": 15032,"Sequence number": 246702, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [], [], [], [], []], "Ev Idx": 8527 } }, { "ph": "s", "id": 66, "pid": 1336754, "tid": 1336754, "ts": 1295650523870.987, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650523888.769, "dur": 3.076, "args": { "External id": 15033,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650523889.674, "dur": 1.932, "args": { "External id": 15034,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650523902.570, "dur": 8.877, "args": { "External id": 15035,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650523906.384, "dur": 4.691, "args": { "External id": 15036,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650523921.662, "dur": 6.556, "args": { "External id": 15037,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524085.327, "dur": 4.359, "args": { "External id": 15038,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524086.374, "dur": 2.774, "args": { "External id": 15039,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650524120.915, "dur": 94.276, "args": { "External id": 15040,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650524121.905, "dur": 9.486, "args": { "External id": 15041,"Sequence number": 246703, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8536 } }, { "ph": "s", "id": 65, "pid": 1336754, "tid": 1336754, "ts": 1295650524121.905, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650524124.475, "dur": 5.779, "args": { "External id": 15042,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524128.734, "dur": 1.298, "args": { "External id": 15043,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650524132.449, "dur": 82.493, "args": { "External id": 15044,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524133.865, "dur": 3.073, "args": { "External id": 15045,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524134.310, "dur": 2.505, "args": { "External id": 15046,"Sequence number": 246704, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8541 } }, { "ph": "s", "id": 64, "pid": 1336754, "tid": 1336754, "ts": 1295650524134.310, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650524139.763, "dur": 69.291, "args": { "External id": 15047,"Sequence number": 246705, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8542 } }, { "ph": "s", "id": 63, "pid": 1336754, "tid": 1336754, "ts": 1295650524139.763, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650524210.856, "dur": 3.532, "args": { "External id": 15048,"Sequence number": 246706, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8543 } }, { "ph": "s", "id": 62, "pid": 1336754, "tid": 1336754, "ts": 1295650524210.856, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650524223.274, "dur": 92.513, "args": { "External id": 15049,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650524224.046, "dur": 26.273, "args": { "External id": 15050,"Sequence number": 246707, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8545 } }, { "ph": "s", "id": 61, "pid": 1336754, "tid": 1336754, "ts": 1295650524224.046, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650524225.853, "dur": 22.730, "args": { "External id": 15051,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524244.564, "dur": 3.372, "args": { "External id": 15052,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650524251.001, "dur": 64.499, "args": { "External id": 15053,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524252.347, "dur": 3.959, "args": { "External id": 15054,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524253.049, "dur": 3.116, "args": { "External id": 15055,"Sequence number": 246708, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8550 } }, { "ph": "s", "id": 60, "pid": 1336754, "tid": 1336754, "ts": 1295650524253.049, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650524256.907, "dur": 49.034, "args": { "External id": 15056,"Sequence number": 246709, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8551 } }, { "ph": "s", "id": 59, "pid": 1336754, "tid": 1336754, "ts": 1295650524256.907, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650524307.608, "dur": 7.360, "args": { "External id": 15057,"Sequence number": 246710, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8552 } }, { "ph": "s", "id": 58, "pid": 1336754, "tid": 1336754, "ts": 1295650524307.608, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650524323.995, "dur": 61.370, "args": { "External id": 15058,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650524324.787, "dur": 5.099, "args": { "External id": 15059,"Sequence number": 246711, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8554 } }, { "ph": "s", "id": 57, "pid": 1336754, "tid": 1336754, "ts": 1295650524324.787, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650524326.434, "dur": 2.305, "args": { "External id": 15060,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524327.870, "dur": 0.724, "args": { "External id": 15061,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650524332.687, "dur": 52.372, "args": { "External id": 15062,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524333.685, "dur": 4.537, "args": { "External id": 15063,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524334.584, "dur": 3.507, "args": { "External id": 15064,"Sequence number": 246712, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8559 } }, { "ph": "s", "id": 56, "pid": 1336754, "tid": 1336754, "ts": 1295650524334.584, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650524338.862, "dur": 39.973, "args": { "External id": 15065,"Sequence number": 246713, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8560 } }, { "ph": "s", "id": 55, "pid": 1336754, "tid": 1336754, "ts": 1295650524338.862, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650524380.227, "dur": 4.528, "args": { "External id": 15066,"Sequence number": 246714, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8561 } }, { "ph": "s", "id": 54, "pid": 1336754, "tid": 1336754, "ts": 1295650524380.227, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524400.703, "dur": 3.762, "args": { "External id": 15067,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524401.764, "dur": 2.586, "args": { "External id": 15068,"Sequence number": 246715, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8563 } }, { "ph": "s", "id": 53, "pid": 1336754, "tid": 1336754, "ts": 1295650524401.764, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524410.595, "dur": 3.253, "args": { "External id": 15069,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524411.716, "dur": 2.007, "args": { "External id": 15070,"Sequence number": 246716, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8565 } }, { "ph": "s", "id": 52, "pid": 1336754, "tid": 1336754, "ts": 1295650524411.716, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524420.008, "dur": 5.542, "args": { "External id": 15071,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524421.382, "dur": 4.010, "args": { "External id": 15072,"Sequence number": 246717, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 32, 64]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8567 } }, { "ph": "s", "id": 51, "pid": 1336754, "tid": 1336754, "ts": 1295650524421.382, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650524454.721, "dur": 145.061, "args": { "External id": 15073,"Sequence number": 246718, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8568 } }, { "ph": "s", "id": 50, "pid": 1336754, "tid": 1336754, "ts": 1295650524454.721, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650524473.466, "dur": 8.391, "args": { "External id": 15074,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524476.303, "dur": 5.160, "args": { "External id": 15075,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8570 } }, { "ph": "X", "cat": "cpu_op", "name": "RotaryEmbeddingFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650524611.309, "dur": 102.263, "args": { "External id": 15076,"Sequence number": 246719, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "False", "False", "0", "", "8192"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [32, 1], [32, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [8192, 32], [8192, 32], [], [], [], [], []], "Ev Idx": 8571 } }, { "ph": "s", "id": 49, "pid": 1336754, "tid": 1336754, "ts": 1295650524611.309, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650524626.291, "dur": 6.971, "args": { "External id": 15077,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524628.550, "dur": 4.267, "args": { "External id": 15078,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8573 } }, { "ph": "X", "cat": "cpu_op", "name": "FlashAttnFunc", "pid": 1336754, "tid": 1336754, "ts": 1295650524740.008, "dur": 173.784, "args": { "External id": 15079,"Sequence number": 246720, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "", "True", "", "0.", "", "False", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "", "Scalar", "", "Scalar", "", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], [], []], "Ev Idx": 8574 } }, { "ph": "s", "id": 48, "pid": 1336754, "tid": 1336754, "ts": 1295650524740.008, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "flash_attn::_flash_attn_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650524767.169, "dur": 122.200, "args": { "External id": 15080,"Record function id": 0, "Concrete Inputs": ["", "", "", "0.", "0.125", "True", "-1", "-1", "0.", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [8388608, 2048, 64, 1], [], [], [], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [16, 4096, 32, 64], [16, 4096, 32, 64], [], [], [], [], [], [], [], []], "Ev Idx": 8575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650524815.374, "dur": 7.610, "args": { "External id": 15081,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", ""], "Input type": ["c10::BFloat16", "", "", "", "", ""], "Input Strides": [[8388608, 2048, 64, 1], [], [], [], [], []], "Input Dims": [[16, 4096, 32, 64], [], [], [], [], []], "Ev Idx": 8576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524817.815, "dur": 4.418, "args": { "External id": 15082,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 32, 64]", "[8388608, 2048, 64, 1]", "15", "0", "", ""], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650524825.659, "dur": 4.773, "args": { "External id": 15083,"Record function id": 0, "Concrete Inputs": ["[16, 32, 4096]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650524831.709, "dur": 3.538, "args": { "External id": 15084,"Record function id": 0, "Concrete Inputs": ["[0]", "15", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650524837.430, "dur": 2.747, "args": { "External id": 15085,"Record function id": 0, "Concrete Inputs": ["[2]", "4", "", "", "", ""], "Input type": ["ScalarList", "Scalar", "", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::alias", "pid": 1336754, "tid": 1336754, "ts": 1295650524900.533, "dur": 4.347, "args": { "External id": 15086,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[8388608, 2048, 64, 1]], "Input Dims": [[16, 4096, 32, 64]], "Ev Idx": 8581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524918.621, "dur": 4.602, "args": { "External id": 15087,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524919.560, "dur": 3.540, "args": { "External id": 15088,"Sequence number": 246721, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, -1]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 64, 1], []], "Input Dims": [[16, 4096, 32, 64], []], "Ev Idx": 8583 } }, { "ph": "s", "id": 47, "pid": 1336754, "tid": 1336754, "ts": 1295650524919.560, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650524934.062, "dur": 148.371, "args": { "External id": 15089,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [2048, 2048], []], "Ev Idx": 8584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650524937.488, "dur": 7.853, "args": { "External id": 15090,"Sequence number": 246722, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[2048, 2048]], "Ev Idx": 8585 } }, { "ph": "s", "id": 46, "pid": 1336754, "tid": 1336754, "ts": 1295650524937.488, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650524940.206, "dur": 3.991, "args": { "External id": 15091,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[2048, 2048], [], []], "Ev Idx": 8586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650524942.571, "dur": 1.341, "args": { "External id": 15092,"Record function id": 0, "Concrete Inputs": ["", "[2048, 2048]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[2048, 2048], [], [], []], "Ev Idx": 8587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650524946.299, "dur": 135.855, "args": { "External id": 15093,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 2048]], "Ev Idx": 8588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650524948.079, "dur": 4.997, "args": { "External id": 15094,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650524950.737, "dur": 2.216, "args": { "External id": 15095,"Sequence number": 246723, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8590 } }, { "ph": "s", "id": 45, "pid": 1336754, "tid": 1336754, "ts": 1295650524950.737, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650524953.881, "dur": 118.868, "args": { "External id": 15096,"Sequence number": 246724, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 2048]], "Ev Idx": 8591 } }, { "ph": "s", "id": 44, "pid": 1336754, "tid": 1336754, "ts": 1295650524953.881, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650525076.484, "dur": 4.896, "args": { "External id": 15097,"Sequence number": 246725, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8592 } }, { "ph": "s", "id": 43, "pid": 1336754, "tid": 1336754, "ts": 1295650525076.484, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "LayerNormFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650525119.596, "dur": 242.411, "args": { "External id": 15098,"Sequence number": 246726, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "9.9999999999999995e-07", "True", "False", "True"], "Input type": ["c10::BFloat16", "c10::BFloat16", "", "c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8388608, 2048, 1], [1], [], [8388608, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [2048], [], [16, 4096, 2048], [], [], [], []], "Ev Idx": 8593 } }, { "ph": "s", "id": 42, "pid": 1336754, "tid": 1336754, "ts": 1295650525119.596, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525141.798, "dur": 2.820, "args": { "External id": 15099,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525142.583, "dur": 1.886, "args": { "External id": 15100,"Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape_as", "pid": 1336754, "tid": 1336754, "ts": 1295650525149.677, "dur": 3.205, "args": { "External id": 15101,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [2048, 1]], "Input Dims": [[16, 4096, 2048], [65536, 2048]], "Ev Idx": 8596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525150.891, "dur": 1.867, "args": { "External id": 15102,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525151.642, "dur": 1.003, "args": { "External id": 15103,"Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650525160.429, "dur": 9.574, "args": { "External id": 15104,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650525164.645, "dur": 4.951, "args": { "External id": 15105,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650525175.903, "dur": 3.779, "args": { "External id": 15106,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650525182.858, "dur": 4.574, "args": { "External id": 15107,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525338.436, "dur": 4.027, "args": { "External id": 15108,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525339.468, "dur": 2.693, "args": { "External id": 15109,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525345.260, "dur": 2.435, "args": { "External id": 15110,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525346.192, "dur": 1.384, "args": { "External id": 15111,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650525382.465, "dur": 104.270, "args": { "External id": 15112,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650525383.826, "dur": 10.541, "args": { "External id": 15113,"Sequence number": 246727, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8608 } }, { "ph": "s", "id": 41, "pid": 1336754, "tid": 1336754, "ts": 1295650525383.826, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650525386.539, "dur": 6.459, "args": { "External id": 15114,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650525388.989, "dur": 3.696, "args": { "External id": 15115,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650525395.386, "dur": 90.994, "args": { "External id": 15116,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525397.130, "dur": 5.763, "args": { "External id": 15117,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525399.945, "dur": 2.793, "args": { "External id": 15118,"Sequence number": 246728, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8613 } }, { "ph": "s", "id": 40, "pid": 1336754, "tid": 1336754, "ts": 1295650525399.945, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650525403.722, "dur": 74.698, "args": { "External id": 15119,"Sequence number": 246729, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8614 } }, { "ph": "s", "id": 39, "pid": 1336754, "tid": 1336754, "ts": 1295650525403.722, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650525480.506, "dur": 5.194, "args": { "External id": 15120,"Sequence number": 246730, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8615 } }, { "ph": "s", "id": 38, "pid": 1336754, "tid": 1336754, "ts": 1295650525480.506, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650525495.108, "dur": 75.235, "args": { "External id": 15121,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[8388608, 2048, 1], [2048, 1], []], "Input Dims": [[16, 4096, 2048], [5632, 2048], []], "Ev Idx": 8616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650525495.894, "dur": 8.564, "args": { "External id": 15122,"Sequence number": 246731, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[5632, 2048]], "Ev Idx": 8617 } }, { "ph": "s", "id": 37, "pid": 1336754, "tid": 1336754, "ts": 1295650525495.894, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650525500.254, "dur": 3.034, "args": { "External id": 15123,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[5632, 2048], [], []], "Ev Idx": 8618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650525502.222, "dur": 0.880, "args": { "External id": 15124,"Record function id": 0, "Concrete Inputs": ["", "[2048, 5632]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[5632, 2048], [], [], []], "Ev Idx": 8619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650525505.688, "dur": 64.312, "args": { "External id": 15125,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[8388608, 2048, 1], [1, 2048]], "Input Dims": [[16, 4096, 2048], [2048, 5632]], "Ev Idx": 8620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525507.094, "dur": 7.145, "args": { "External id": 15126,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525510.245, "dur": 3.866, "args": { "External id": 15127,"Sequence number": 246732, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[65536, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8622 } }, { "ph": "s", "id": 36, "pid": 1336754, "tid": 1336754, "ts": 1295650525510.245, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650525514.869, "dur": 48.364, "args": { "External id": 15128,"Sequence number": 246733, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[65536, 2048], [2048, 5632]], "Ev Idx": 8623 } }, { "ph": "s", "id": 35, "pid": 1336754, "tid": 1336754, "ts": 1295650525514.869, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650525565.108, "dur": 4.462, "args": { "External id": 15129,"Sequence number": 246734, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[5632, 1], []], "Input Dims": [[65536, 5632], []], "Ev Idx": 8624 } }, { "ph": "s", "id": 34, "pid": 1336754, "tid": 1336754, "ts": 1295650525565.108, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "SwiGLULinearFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650525590.036, "dur": 146.166, "args": { "External id": 15130,"Sequence number": 246735, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8625 } }, { "ph": "s", "id": 33, "pid": 1336754, "tid": 1336754, "ts": 1295650525590.036, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650525629.493, "dur": 4.356, "args": { "External id": 15131,"Record function id": 0, "Concrete Inputs": ["[16, 4096, 5632]", "15", "", "", "", "0"], "Input type": ["ScalarList", "Scalar", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650525664.039, "dur": 61.535, "args": { "External id": 15132,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[23068672, 5632, 1], [5632, 1], []], "Input Dims": [[16, 4096, 5632], [2048, 5632], []], "Ev Idx": 8627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650525664.874, "dur": 6.704, "args": { "External id": 15133,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[5632, 1]], "Input Dims": [[2048, 5632]], "Ev Idx": 8628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650525665.946, "dur": 4.958, "args": { "External id": 15134,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[5632, 1], [], []], "Input Dims": [[2048, 5632], [], []], "Ev Idx": 8629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650525667.820, "dur": 2.877, "args": { "External id": 15135,"Record function id": 0, "Concrete Inputs": ["", "[5632, 2048]", "[1, 5632]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[5632, 1], [], [], []], "Input Dims": [[2048, 5632], [], [], []], "Ev Idx": 8630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650525672.518, "dur": 52.539, "args": { "External id": 15136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[23068672, 5632, 1], [1, 5632]], "Input Dims": [[16, 4096, 5632], [5632, 2048]], "Ev Idx": 8631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reshape", "pid": 1336754, "tid": 1336754, "ts": 1295650525674.079, "dur": 5.126, "args": { "External id": 15137,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525677.752, "dur": 1.325, "args": { "External id": 15138,"Record function id": 0, "Concrete Inputs": ["", "[65536, 5632]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[23068672, 5632, 1], []], "Input Dims": [[16, 4096, 5632], []], "Ev Idx": 8633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650525679.983, "dur": 41.575, "args": { "External id": 15139,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[5632, 1], [1, 5632]], "Input Dims": [[65536, 5632], [5632, 2048]], "Ev Idx": 8634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_unsafe_view", "pid": 1336754, "tid": 1336754, "ts": 1295650525723.414, "dur": 1.094, "args": { "External id": 15140,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295650525744.286, "dur": 26.252, "args": { "External id": 15141,"Sequence number": 246736, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[8388608, 2048, 1], [8388608, 2048, 1], []], "Input Dims": [[16, 4096, 2048], [16, 4096, 2048], []], "Ev Idx": 8636 } }, { "ph": "s", "id": 32, "pid": 1336754, "tid": 1336754, "ts": 1295650525744.286, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336754, "tid": 1336754, "ts": 1295650525787.636, "dur": 42.368, "args": { "External id": 15142,"Sequence number": 246737, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "-2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8637 } }, { "ph": "s", "id": 31, "pid": 1336754, "tid": 1336754, "ts": 1295650525787.636, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336754, "tid": 1336754, "ts": 1295650525797.364, "dur": 28.305, "args": { "External id": 15143,"Record function id": 0, "Concrete Inputs": ["", "2"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[[8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1], [8388608, 2048, 1]], []], "Input Dims": [[[16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048], [16, 4096, 2048]], []], "Ev Idx": 8638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650525827.106, "dur": 1.326, "args": { "External id": 15144,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 8192], []], "Ev Idx": 8639 } }, { "ph": "X", "cat": "cpu_op", "name": "TorchDynamo Cache Lookup", "pid": 1336754, "tid": 1336754, "ts": 1295650525864.334, "dur": 45.767, "args": { "External id": 15145,"Record function id": 0, "Ev Idx": 8640 } }, { "ph": "X", "cat": "cpu_op", "name": "Torch-Compiled Region: 2/0", "pid": 1336754, "tid": 1336754, "ts": 1295650525911.145, "dur": 245.767, "args": { "External id": 15146,"Record function id": 0, "Ev Idx": 8641 } }, { "ph": "X", "cat": "cpu_op", "name": "CompiledFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650525949.752, "dur": 197.597, "args": { "External id": 15147,"Sequence number": 246738, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1], [33554432, 8192, 2048, 1]], "Input Dims": [[2048], [16, 4096, 4, 2048]], "Ev Idx": 8642 } }, { "ph": "s", "id": 30, "pid": 1336754, "tid": 1336754, "ts": 1295650525949.752, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "layer_norm_fwd_kernel_0", "pid": 1336754, "tid": 1336754, "ts": 1295650526060.120, "dur": 45.776, "args": { "External id": 15148,"kernel_hash": "caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo", "Record function id": 0, "stream": 0, "Concrete Inputs": ["", "", "", "", "2048", "1", "9.9999999999999995e-07", "True", "2048", "False", "False", "True", "False"], "kernel_file": "/tmp/torchinductor_cvm/ao/caowdwy4dip5p7sg7hk44j6kom6frhip3u2qpmolzfoijzloazlo.py", "kernel_backend": "triton", "Input type": ["c10::BFloat16", "c10::BFloat16", "c10::BFloat16", "float", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], [1], [1], [], [], [], [], [], [], [], [], []], "Input Dims": [[262144, 2048], [262144, 2048], [2048], [262144], [], [], [], [], [], [], [], [], []], "Ev Idx": 8643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650526257.378, "dur": 42.734, "args": { "External id": 15149,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526259.944, "dur": 6.814, "args": { "External id": 15150,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526270.176, "dur": 29.633, "args": { "External id": 15151,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526273.159, "dur": 26.105, "args": { "External id": 15152,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650526305.149, "dur": 18.394, "args": { "External id": 15153,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526305.835, "dur": 2.897, "args": { "External id": 15154,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526311.500, "dur": 11.735, "args": { "External id": 15155,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526312.126, "dur": 10.728, "args": { "External id": 15156,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650526326.795, "dur": 15.976, "args": { "External id": 15157,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False"], "Input type": ["ScalarList", "", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526327.291, "dur": 2.758, "args": { "External id": 15158,"Record function id": 0, "Concrete Inputs": ["[1]", "", "", "", "False", ""], "Input type": ["ScalarList", "", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526330.688, "dur": 11.801, "args": { "External id": 15159,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[1]], "Ev Idx": 8654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526331.260, "dur": 10.845, "args": { "External id": 15160,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 8655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650526352.353, "dur": 0.713, "args": { "External id": 15161,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "False", "False", ""], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[8192, 1], [], [], [], [], [], [], []], "Input Dims": [[16, 8192], [], [], [], [], [], [], []], "Ev Idx": 8656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unfold", "pid": 1336754, "tid": 1336754, "ts": 1295650526360.323, "dur": 11.490, "args": { "External id": 15162,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "5", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526367.588, "dur": 2.417, "args": { "External id": 15163,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 8192], [], [], []], "Ev Idx": 8658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526378.493, "dur": 7.738, "args": { "External id": 15164,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526383.143, "dur": 1.288, "args": { "External id": 15165,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526387.312, "dur": 3.108, "args": { "External id": 15166,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526389.269, "dur": 0.518, "args": { "External id": 15167,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 5]", "[8192, 1, 1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526391.877, "dur": 3.070, "args": { "External id": 15168,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 5], [], [], [], []], "Ev Idx": 8663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526393.710, "dur": 0.707, "args": { "External id": 15169,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 5], [], [], []], "Ev Idx": 8664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526397.971, "dur": 3.384, "args": { "External id": 15170,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526400.246, "dur": 0.587, "args": { "External id": 15171,"Record function id": 0, "Concrete Inputs": ["", "[16, 8188, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526402.470, "dur": 3.033, "args": { "External id": 15172,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "4096", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 8188, 4], [], [], [], []], "Ev Idx": 8667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526404.268, "dur": 0.548, "args": { "External id": 15173,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 8188, 4], [], [], []], "Ev Idx": 8668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526406.336, "dur": 3.641, "args": { "External id": 15174,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4096, 4], [], [], [], []], "Ev Idx": 8669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526408.443, "dur": 1.020, "args": { "External id": 15175,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650526413.687, "dur": 5.274, "args": { "External id": 15176,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4096, 4], [], []], "Ev Idx": 8671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526417.365, "dur": 0.799, "args": { "External id": 15177,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4096, 4], [], [], []], "Ev Idx": 8672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526423.044, "dur": 3.399, "args": { "External id": 15178,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 8673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526424.886, "dur": 0.992, "args": { "External id": 15179,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650526431.871, "dur": 6.694, "args": { "External id": 15180,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 8675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526436.389, "dur": 1.005, "args": { "External id": 15181,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 8676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526439.619, "dur": 3.083, "args": { "External id": 15182,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 8677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526441.447, "dur": 0.695, "args": { "External id": 15183,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 8678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526445.032, "dur": 7.997, "args": { "External id": 15184,"Sequence number": 246739, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8679 } }, { "ph": "s", "id": 29, "pid": 1336754, "tid": 1336754, "ts": 1295650526445.032, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526450.604, "dur": 0.798, "args": { "External id": 15185,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526454.289, "dur": 5.526, "args": { "External id": 15186,"Sequence number": 246740, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 8681 } }, { "ph": "s", "id": 28, "pid": 1336754, "tid": 1336754, "ts": 1295650526454.289, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526458.165, "dur": 0.842, "args": { "External id": 15187,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650526460.756, "dur": 6.842, "args": { "External id": 15188,"Sequence number": 246741, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 8683 } }, { "ph": "s", "id": 27, "pid": 1336754, "tid": 1336754, "ts": 1295650526460.756, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526465.912, "dur": 0.735, "args": { "External id": 15189,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 8684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650526468.537, "dur": 6.369, "args": { "External id": 15190,"Sequence number": 246742, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 8685 } }, { "ph": "s", "id": 26, "pid": 1336754, "tid": 1336754, "ts": 1295650526468.537, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526471.781, "dur": 2.358, "args": { "External id": 15191,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 8686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650526479.519, "dur": 37.511, "args": { "External id": 15192,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650526481.635, "dur": 35.195, "args": { "External id": 15193,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526484.299, "dur": 5.857, "args": { "External id": 15194,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 8689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526486.432, "dur": 3.098, "args": { "External id": 15195,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650526491.475, "dur": 24.891, "args": { "External id": 15196,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 8691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650526539.161, "dur": 3.674, "args": { "External id": 15197,"Sequence number": 246743, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 8692 } }, { "ph": "s", "id": 25, "pid": 1336754, "tid": 1336754, "ts": 1295650526539.161, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650526545.331, "dur": 1.208, "args": { "External id": 15198,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 8693 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650526575.373, "dur": 72281.921, "args": { "External id": 15199,"Sequence number": 246744, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 8694 } }, { "ph": "s", "id": 24, "pid": 1336754, "tid": 1336754, "ts": 1295650526575.373, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650526589.347, "dur": 29.772, "args": { "External id": 15200,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650526590.226, "dur": 28.651, "args": { "External id": 15201,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526591.281, "dur": 6.932, "args": { "External id": 15202,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526592.434, "dur": 5.342, "args": { "External id": 15203,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650526599.015, "dur": 19.451, "args": { "External id": 15204,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 8699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526636.315, "dur": 24.397, "args": { "External id": 15205,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526637.410, "dur": 5.982, "args": { "External id": 15206,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 8701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526639.576, "dur": 3.502, "args": { "External id": 15207,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526644.132, "dur": 16.377, "args": { "External id": 15208,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 8703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526645.144, "dur": 15.058, "args": { "External id": 15209,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 8704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526664.487, "dur": 30.768, "args": { "External id": 15210,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650526665.665, "dur": 6.772, "args": { "External id": 15211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 8706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526669.259, "dur": 2.902, "args": { "External id": 15212,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526682.705, "dur": 12.381, "args": { "External id": 15213,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526683.204, "dur": 11.510, "args": { "External id": 15214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 8709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650526699.975, "dur": 19.511, "args": { "External id": 15215,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 8710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650526700.820, "dur": 5.420, "args": { "External id": 15216,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650526707.015, "dur": 12.223, "args": { "External id": 15217,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 8712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650526707.769, "dur": 11.073, "args": { "External id": 15218,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1336754, "ts": 1295650526727.636, "dur": 27.253, "args": { "External id": 15219,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650526758.954, "dur": 60.406, "args": { "External id": 15220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 8715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650526762.649, "dur": 56.186, "args": { "External id": 15221,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526767.863, "dur": 1.118, "args": { "External id": 15222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 8717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650526771.053, "dur": 25.951, "args": { "External id": 15223,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650526772.606, "dur": 24.195, "args": { "External id": 15224,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 8719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650526777.413, "dur": 3.322, "args": { "External id": 15225,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650526781.485, "dur": 14.815, "args": { "External id": 15226,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 8721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295650526823.600, "dur": 66003.808, "args": { "External id": 15227,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295650526825.673, "dur": 66000.090, "args": { "External id": 15228,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 8723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650592840.202, "dur": 8.974, "args": { "External id": 15229,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650592846.194, "dur": 1.347, "args": { "External id": 15230,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650592854.114, "dur": 117.016, "args": { "External id": 15231,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650592855.810, "dur": 8.720, "args": { "External id": 15232,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650592857.883, "dur": 5.807, "args": { "External id": 15233,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650592862.671, "dur": 0.786, "args": { "External id": 15234,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650592865.980, "dur": 104.554, "args": { "External id": 15235,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650592870.031, "dur": 99.679, "args": { "External id": 15236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650592974.812, "dur": 4.526, "args": { "External id": 15237,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650592977.095, "dur": 0.952, "args": { "External id": 15238,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650593013.403, "dur": 4.369, "args": { "External id": 15239,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593029.718, "dur": 7.920, "args": { "External id": 15240,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593032.022, "dur": 5.289, "args": { "External id": 15241,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650593183.189, "dur": 261.664, "args": { "External id": 15242,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593188.096, "dur": 2.593, "args": { "External id": 15243,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650593193.405, "dur": 250.769, "args": { "External id": 15244,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650593196.016, "dur": 0.506, "args": { "External id": 15245,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650593199.200, "dur": 44.471, "args": { "External id": 15246,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650593246.823, "dur": 6.746, "args": { "External id": 15247,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593252.172, "dur": 1.020, "args": { "External id": 15248,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650593255.854, "dur": 31.584, "args": { "External id": 15249,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593257.036, "dur": 2.078, "args": { "External id": 15250,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650593263.305, "dur": 23.830, "args": { "External id": 15251,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650593268.068, "dur": 3.582, "args": { "External id": 15252,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650593289.550, "dur": 29.444, "args": { "External id": 15253,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650593321.115, "dur": 18.027, "args": { "External id": 15254,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650593342.833, "dur": 20.142, "args": { "External id": 15255,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650593365.546, "dur": 16.597, "args": { "External id": 15256,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650593384.595, "dur": 25.367, "args": { "External id": 15257,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650593386.488, "dur": 1.838, "args": { "External id": 15258,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593393.071, "dur": 0.720, "args": { "External id": 15259,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650593412.565, "dur": 15.021, "args": { "External id": 15260,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650593429.839, "dur": 13.329, "args": { "External id": 15261,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650593453.322, "dur": 2.787, "args": { "External id": 15262,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650593463.483, "dur": 4.403, "args": { "External id": 15263,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593466.226, "dur": 0.774, "args": { "External id": 15264,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650593554.385, "dur": 79.349, "args": { "External id": 15265,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650593639.716, "dur": 7.284, "args": { "External id": 15266,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593644.722, "dur": 1.049, "args": { "External id": 15267,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650593648.553, "dur": 34.018, "args": { "External id": 15268,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650593689.197, "dur": 6.947, "args": { "External id": 15269,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650593691.046, "dur": 4.390, "args": { "External id": 15270,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593693.255, "dur": 1.954, "args": { "External id": 15271,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650593700.316, "dur": 51.021, "args": { "External id": 15272,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650593703.830, "dur": 47.014, "args": { "External id": 15273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650593756.464, "dur": 18.906, "args": { "External id": 15274,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650593781.262, "dur": 3.630, "args": { "External id": 15275,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593783.282, "dur": 0.764, "args": { "External id": 15276,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650593789.301, "dur": 53.804, "args": { "External id": 15277,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650593790.104, "dur": 6.371, "args": { "External id": 15278,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650593791.182, "dur": 4.588, "args": { "External id": 15279,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593794.641, "dur": 0.990, "args": { "External id": 15280,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650593797.062, "dur": 45.628, "args": { "External id": 15281,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650593797.624, "dur": 44.291, "args": { "External id": 15282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650593847.480, "dur": 5.955, "args": { "External id": 15283,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650593849.391, "dur": 2.880, "args": { "External id": 15284,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650593859.887, "dur": 1.733, "args": { "External id": 15285,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593871.540, "dur": 6.447, "args": { "External id": 15286,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593873.631, "dur": 4.065, "args": { "External id": 15287,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650593970.281, "dur": 242.981, "args": { "External id": 15288,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650593973.018, "dur": 2.233, "args": { "External id": 15289,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650593976.891, "dur": 235.842, "args": { "External id": 15290,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650593978.362, "dur": 0.313, "args": { "External id": 15291,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650594018.824, "dur": 30.326, "args": { "External id": 15292,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650594051.190, "dur": 4.067, "args": { "External id": 15293,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594053.376, "dur": 1.546, "args": { "External id": 15294,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650594056.594, "dur": 26.695, "args": { "External id": 15295,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650594057.538, "dur": 1.962, "args": { "External id": 15296,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650594060.759, "dur": 22.182, "args": { "External id": 15297,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650594065.796, "dur": 3.630, "args": { "External id": 15298,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650594084.931, "dur": 22.905, "args": { "External id": 15299,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650594109.390, "dur": 15.982, "args": { "External id": 15300,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650594128.355, "dur": 14.727, "args": { "External id": 15301,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650594146.805, "dur": 14.396, "args": { "External id": 15302,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650594163.103, "dur": 21.176, "args": { "External id": 15303,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650594165.158, "dur": 1.860, "args": { "External id": 15304,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594169.083, "dur": 0.730, "args": { "External id": 15305,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650594186.093, "dur": 13.420, "args": { "External id": 15306,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650594200.618, "dur": 11.013, "args": { "External id": 15307,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650594224.109, "dur": 2.282, "args": { "External id": 15308,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650594252.035, "dur": 4.918, "args": { "External id": 15309,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594254.883, "dur": 0.892, "args": { "External id": 15310,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650594335.357, "dur": 61.630, "args": { "External id": 15311,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650594402.185, "dur": 4.996, "args": { "External id": 15312,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594405.024, "dur": 1.105, "args": { "External id": 15313,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650594408.946, "dur": 29.086, "args": { "External id": 15314,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650594442.869, "dur": 7.028, "args": { "External id": 15315,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650594444.233, "dur": 5.061, "args": { "External id": 15316,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594448.283, "dur": 0.795, "args": { "External id": 15317,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650594452.880, "dur": 44.951, "args": { "External id": 15318,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650594454.128, "dur": 43.195, "args": { "External id": 15319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650594501.898, "dur": 19.989, "args": { "External id": 15320,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650594527.773, "dur": 3.747, "args": { "External id": 15321,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594529.989, "dur": 0.624, "args": { "External id": 15322,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650594537.874, "dur": 51.052, "args": { "External id": 15323,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650594538.946, "dur": 5.838, "args": { "External id": 15324,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650594539.822, "dur": 4.422, "args": { "External id": 15325,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594543.398, "dur": 0.660, "args": { "External id": 15326,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650594545.405, "dur": 43.071, "args": { "External id": 15327,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650594545.861, "dur": 42.085, "args": { "External id": 15328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650594593.314, "dur": 4.249, "args": { "External id": 15329,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594595.473, "dur": 1.053, "args": { "External id": 15330,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650594605.779, "dur": 1.531, "args": { "External id": 15331,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650594614.960, "dur": 6.177, "args": { "External id": 15332,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650594617.043, "dur": 3.832, "args": { "External id": 15333,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650594707.024, "dur": 338.455, "args": { "External id": 15334,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650594709.443, "dur": 2.286, "args": { "External id": 15335,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650594713.161, "dur": 331.793, "args": { "External id": 15336,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650594717.057, "dur": 0.269, "args": { "External id": 15337,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650594720.206, "dur": 21.619, "args": { "External id": 15338,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650594743.641, "dur": 4.080, "args": { "External id": 15339,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594745.849, "dur": 1.621, "args": { "External id": 15340,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650594748.536, "dur": 28.874, "args": { "External id": 15341,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650594751.709, "dur": 1.609, "args": { "External id": 15342,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650594754.397, "dur": 22.752, "args": { "External id": 15343,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650594756.509, "dur": 2.430, "args": { "External id": 15344,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650594778.799, "dur": 22.425, "args": { "External id": 15345,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650594802.658, "dur": 38.444, "args": { "External id": 15346,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650594843.634, "dur": 43.139, "args": { "External id": 15347,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650594890.444, "dur": 39.782, "args": { "External id": 15348,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650594932.081, "dur": 42.538, "args": { "External id": 15349,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650594933.910, "dur": 1.798, "args": { "External id": 15350,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650594937.604, "dur": 0.773, "args": { "External id": 15351,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650594976.134, "dur": 51.029, "args": { "External id": 15352,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650595029.615, "dur": 13.789, "args": { "External id": 15353,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650595056.033, "dur": 2.774, "args": { "External id": 15354,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595068.390, "dur": 3.946, "args": { "External id": 15355,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595070.774, "dur": 0.646, "args": { "External id": 15356,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650595141.177, "dur": 57.477, "args": { "External id": 15357,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595203.481, "dur": 7.168, "args": { "External id": 15358,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595206.145, "dur": 3.288, "args": { "External id": 15359,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650595212.268, "dur": 41.503, "args": { "External id": 15360,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650595295.752, "dur": 8.658, "args": { "External id": 15361,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650595299.977, "dur": 3.721, "args": { "External id": 15362,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595302.201, "dur": 1.269, "args": { "External id": 15363,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650595307.470, "dur": 48.513, "args": { "External id": 15364,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650595308.730, "dur": 46.739, "args": { "External id": 15365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650595360.060, "dur": 18.149, "args": { "External id": 15366,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595384.578, "dur": 6.358, "args": { "External id": 15367,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595389.160, "dur": 0.891, "args": { "External id": 15368,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650595395.113, "dur": 49.729, "args": { "External id": 15369,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650595395.680, "dur": 3.259, "args": { "External id": 15370,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650595396.469, "dur": 1.953, "args": { "External id": 15371,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595397.604, "dur": 0.677, "args": { "External id": 15372,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650595399.621, "dur": 44.779, "args": { "External id": 15373,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650595400.104, "dur": 43.647, "args": { "External id": 15374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595451.296, "dur": 4.161, "args": { "External id": 15375,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595453.746, "dur": 0.610, "args": { "External id": 15376,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650595461.741, "dur": 1.464, "args": { "External id": 15377,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650595470.775, "dur": 8.573, "args": { "External id": 15378,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650595472.636, "dur": 6.417, "args": { "External id": 15379,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650595570.634, "dur": 191.074, "args": { "External id": 15380,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650595572.633, "dur": 2.340, "args": { "External id": 15381,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650595576.484, "dur": 184.839, "args": { "External id": 15382,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650595577.854, "dur": 0.320, "args": { "External id": 15383,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650595579.299, "dur": 25.304, "args": { "External id": 15384,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650595606.410, "dur": 3.280, "args": { "External id": 15385,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595608.561, "dur": 0.689, "args": { "External id": 15386,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650595610.579, "dur": 26.878, "args": { "External id": 15387,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650595611.823, "dur": 2.118, "args": { "External id": 15388,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650595616.858, "dur": 20.319, "args": { "External id": 15389,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650595621.859, "dur": 2.899, "args": { "External id": 15390,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650595638.924, "dur": 21.008, "args": { "External id": 15391,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650595661.531, "dur": 14.590, "args": { "External id": 15392,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650595678.950, "dur": 14.665, "args": { "External id": 15393,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650595695.116, "dur": 14.090, "args": { "External id": 15394,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650595711.008, "dur": 23.187, "args": { "External id": 15395,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650595712.932, "dur": 1.729, "args": { "External id": 15396,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595718.462, "dur": 1.057, "args": { "External id": 15397,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650595735.405, "dur": 13.189, "args": { "External id": 15398,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650595749.591, "dur": 10.860, "args": { "External id": 15399,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650595767.731, "dur": 1.680, "args": { "External id": 15400,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595777.555, "dur": 3.207, "args": { "External id": 15401,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595779.533, "dur": 0.348, "args": { "External id": 15402,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650595843.136, "dur": 50.308, "args": { "External id": 15403,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650595897.712, "dur": 6.637, "args": { "External id": 15404,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595902.244, "dur": 1.017, "args": { "External id": 15405,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650595905.755, "dur": 23.911, "args": { "External id": 15406,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650595933.646, "dur": 4.616, "args": { "External id": 15407,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650595934.762, "dur": 2.912, "args": { "External id": 15408,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650595936.754, "dur": 0.711, "args": { "External id": 15409,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650595940.593, "dur": 77.431, "args": { "External id": 15410,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650595941.677, "dur": 74.648, "args": { "External id": 15411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650596025.848, "dur": 18.739, "args": { "External id": 15412,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596051.222, "dur": 4.904, "args": { "External id": 15413,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596053.948, "dur": 0.940, "args": { "External id": 15414,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650596059.871, "dur": 56.272, "args": { "External id": 15415,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650596060.601, "dur": 8.298, "args": { "External id": 15416,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650596061.498, "dur": 6.799, "args": { "External id": 15417,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596064.854, "dur": 3.238, "args": { "External id": 15418,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650596069.727, "dur": 46.097, "args": { "External id": 15419,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650596070.492, "dur": 44.837, "args": { "External id": 15420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596120.363, "dur": 4.229, "args": { "External id": 15421,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596122.712, "dur": 0.870, "args": { "External id": 15422,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650596131.266, "dur": 1.496, "args": { "External id": 15423,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596140.389, "dur": 8.600, "args": { "External id": 15424,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596144.635, "dur": 4.075, "args": { "External id": 15425,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650596247.983, "dur": 193.834, "args": { "External id": 15426,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596250.778, "dur": 3.514, "args": { "External id": 15427,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650596255.873, "dur": 185.545, "args": { "External id": 15428,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650596257.637, "dur": 0.486, "args": { "External id": 15429,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650596261.554, "dur": 24.026, "args": { "External id": 15430,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650596287.154, "dur": 3.470, "args": { "External id": 15431,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596289.134, "dur": 1.215, "args": { "External id": 15432,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650596291.332, "dur": 27.429, "args": { "External id": 15433,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596292.460, "dur": 3.684, "args": { "External id": 15434,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650596299.440, "dur": 19.105, "args": { "External id": 15435,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650596302.105, "dur": 3.190, "args": { "External id": 15436,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650596320.267, "dur": 21.770, "args": { "External id": 15437,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650596343.432, "dur": 13.515, "args": { "External id": 15438,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650596359.163, "dur": 15.403, "args": { "External id": 15439,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650596376.062, "dur": 13.646, "args": { "External id": 15440,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650596391.357, "dur": 22.235, "args": { "External id": 15441,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650596393.008, "dur": 1.591, "args": { "External id": 15442,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596398.302, "dur": 0.773, "args": { "External id": 15443,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650596414.706, "dur": 12.910, "args": { "External id": 15444,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650596428.861, "dur": 11.685, "args": { "External id": 15445,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650596449.202, "dur": 1.874, "args": { "External id": 15446,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596460.611, "dur": 3.378, "args": { "External id": 15447,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596462.648, "dur": 0.537, "args": { "External id": 15448,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650596529.433, "dur": 54.795, "args": { "External id": 15449,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596588.926, "dur": 6.739, "args": { "External id": 15450,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596593.787, "dur": 0.891, "args": { "External id": 15451,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650596597.056, "dur": 25.792, "args": { "External id": 15452,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650596627.172, "dur": 6.796, "args": { "External id": 15453,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650596628.401, "dur": 4.946, "args": { "External id": 15454,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596629.969, "dur": 3.132, "args": { "External id": 15455,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650596636.476, "dur": 42.602, "args": { "External id": 15456,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650596639.335, "dur": 39.064, "args": { "External id": 15457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650596682.701, "dur": 15.561, "args": { "External id": 15458,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596703.406, "dur": 3.665, "args": { "External id": 15459,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596705.457, "dur": 0.729, "args": { "External id": 15460,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650596710.711, "dur": 50.352, "args": { "External id": 15461,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 8956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650596711.749, "dur": 5.610, "args": { "External id": 15462,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 8957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650596712.444, "dur": 4.295, "args": { "External id": 15463,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 8958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596715.649, "dur": 0.953, "args": { "External id": 15464,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 8959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650596718.146, "dur": 42.563, "args": { "External id": 15465,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650596718.849, "dur": 41.448, "args": { "External id": 15466,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 8961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650596764.703, "dur": 3.905, "args": { "External id": 15467,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596766.601, "dur": 1.035, "args": { "External id": 15468,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650596784.846, "dur": 1.428, "args": { "External id": 15469,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 8964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596794.746, "dur": 7.783, "args": { "External id": 15470,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 8965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596796.301, "dur": 5.961, "args": { "External id": 15471,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650596883.307, "dur": 246.463, "args": { "External id": 15472,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596885.516, "dur": 2.573, "args": { "External id": 15473,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650596889.972, "dur": 239.187, "args": { "External id": 15474,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 8969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650596901.418, "dur": 0.299, "args": { "External id": 15475,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650596906.757, "dur": 23.075, "args": { "External id": 15476,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 8971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650596931.411, "dur": 5.960, "args": { "External id": 15477,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 8972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650596933.440, "dur": 3.653, "args": { "External id": 15478,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 8973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650596938.199, "dur": 23.474, "args": { "External id": 15479,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650596939.558, "dur": 1.946, "args": { "External id": 15480,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 8975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650596942.465, "dur": 18.931, "args": { "External id": 15481,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 8976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650596944.453, "dur": 3.837, "args": { "External id": 15482,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650596962.883, "dur": 19.491, "args": { "External id": 15483,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650596983.952, "dur": 54.519, "args": { "External id": 15484,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650597043.019, "dur": 16.075, "args": { "External id": 15485,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 8980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650597062.391, "dur": 12.445, "args": { "External id": 15486,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 8981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650597076.785, "dur": 24.451, "args": { "External id": 15487,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 8982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650597078.884, "dur": 2.048, "args": { "External id": 15488,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 8983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597082.561, "dur": 3.253, "args": { "External id": 15489,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 8984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650597102.528, "dur": 13.549, "args": { "External id": 15490,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 8985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650597117.062, "dur": 10.898, "args": { "External id": 15491,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 8986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650597140.207, "dur": 2.478, "args": { "External id": 15492,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 8987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597153.110, "dur": 3.820, "args": { "External id": 15493,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 8988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597155.527, "dur": 0.508, "args": { "External id": 15494,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 8989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650597242.128, "dur": 67.296, "args": { "External id": 15495,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 8990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597315.015, "dur": 5.883, "args": { "External id": 15496,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 8991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597318.262, "dur": 1.116, "args": { "External id": 15497,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 8992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650597322.513, "dur": 27.879, "args": { "External id": 15498,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 8993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650597355.573, "dur": 8.454, "args": { "External id": 15499,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 8994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650597357.386, "dur": 5.995, "args": { "External id": 15500,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 8995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597361.447, "dur": 1.681, "args": { "External id": 15501,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 8996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650597367.267, "dur": 43.772, "args": { "External id": 15502,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650597368.659, "dur": 41.798, "args": { "External id": 15503,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 8998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650597415.282, "dur": 17.480, "args": { "External id": 15504,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 8999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597438.194, "dur": 3.935, "args": { "External id": 15505,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597440.221, "dur": 0.904, "args": { "External id": 15506,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650597448.128, "dur": 50.817, "args": { "External id": 15507,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650597449.576, "dur": 3.883, "args": { "External id": 15508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650597450.572, "dur": 2.346, "args": { "External id": 15509,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597451.901, "dur": 0.828, "args": { "External id": 15510,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650597454.205, "dur": 44.387, "args": { "External id": 15511,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650597454.681, "dur": 43.358, "args": { "External id": 15512,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597503.372, "dur": 3.966, "args": { "External id": 15513,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597505.357, "dur": 0.655, "args": { "External id": 15514,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650597515.045, "dur": 1.508, "args": { "External id": 15515,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650597524.587, "dur": 6.270, "args": { "External id": 15516,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650597526.430, "dur": 4.188, "args": { "External id": 15517,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650597615.612, "dur": 189.450, "args": { "External id": 15518,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650597620.309, "dur": 2.126, "args": { "External id": 15519,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650597623.970, "dur": 180.485, "args": { "External id": 15520,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650597627.158, "dur": 0.312, "args": { "External id": 15521,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650597628.612, "dur": 20.596, "args": { "External id": 15522,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650597650.923, "dur": 5.565, "args": { "External id": 15523,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597655.333, "dur": 0.897, "args": { "External id": 15524,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650597657.495, "dur": 21.687, "args": { "External id": 15525,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650597658.929, "dur": 1.520, "args": { "External id": 15526,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650597661.666, "dur": 17.248, "args": { "External id": 15527,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650597663.801, "dur": 2.791, "args": { "External id": 15528,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650597680.328, "dur": 21.614, "args": { "External id": 15529,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650597703.152, "dur": 13.734, "args": { "External id": 15530,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650597719.248, "dur": 14.407, "args": { "External id": 15531,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650597736.788, "dur": 13.850, "args": { "External id": 15532,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650597752.351, "dur": 21.794, "args": { "External id": 15533,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650597756.151, "dur": 1.394, "args": { "External id": 15534,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597759.590, "dur": 0.630, "args": { "External id": 15535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650597775.856, "dur": 13.324, "args": { "External id": 15536,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650597790.225, "dur": 11.467, "args": { "External id": 15537,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650597811.127, "dur": 1.642, "args": { "External id": 15538,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597820.760, "dur": 3.718, "args": { "External id": 15539,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597823.190, "dur": 0.355, "args": { "External id": 15540,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650597882.634, "dur": 49.898, "args": { "External id": 15541,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650597937.040, "dur": 4.742, "args": { "External id": 15542,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597939.860, "dur": 0.944, "args": { "External id": 15543,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650597943.096, "dur": 25.249, "args": { "External id": 15544,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650597972.534, "dur": 7.696, "args": { "External id": 15545,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650597976.312, "dur": 3.260, "args": { "External id": 15546,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650597978.357, "dur": 0.998, "args": { "External id": 15547,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650597982.395, "dur": 87.277, "args": { "External id": 15548,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650597983.414, "dur": 84.933, "args": { "External id": 15549,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650598075.014, "dur": 17.271, "args": { "External id": 15550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598098.582, "dur": 6.244, "args": { "External id": 15551,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598103.083, "dur": 0.684, "args": { "External id": 15552,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650598108.702, "dur": 50.639, "args": { "External id": 15553,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650598109.531, "dur": 4.075, "args": { "External id": 15554,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650598110.564, "dur": 2.488, "args": { "External id": 15555,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598112.077, "dur": 0.830, "args": { "External id": 15556,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650598114.174, "dur": 44.803, "args": { "External id": 15557,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650598114.711, "dur": 43.785, "args": { "External id": 15558,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598165.168, "dur": 3.939, "args": { "External id": 15559,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598167.011, "dur": 1.049, "args": { "External id": 15560,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650598175.007, "dur": 1.339, "args": { "External id": 15561,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650598184.136, "dur": 6.628, "args": { "External id": 15562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650598186.093, "dur": 4.421, "args": { "External id": 15563,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650598298.045, "dur": 197.851, "args": { "External id": 15564,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650598302.777, "dur": 3.169, "args": { "External id": 15565,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650598307.347, "dur": 188.121, "args": { "External id": 15566,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650598308.795, "dur": 0.309, "args": { "External id": 15567,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650598310.693, "dur": 23.337, "args": { "External id": 15568,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650598335.454, "dur": 6.010, "args": { "External id": 15569,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598339.992, "dur": 0.999, "args": { "External id": 15570,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650598342.421, "dur": 24.628, "args": { "External id": 15571,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650598343.725, "dur": 1.480, "args": { "External id": 15572,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650598348.321, "dur": 18.487, "args": { "External id": 15573,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650598351.243, "dur": 2.841, "args": { "External id": 15574,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650598368.223, "dur": 21.412, "args": { "External id": 15575,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650598391.132, "dur": 16.677, "args": { "External id": 15576,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650598410.816, "dur": 15.046, "args": { "External id": 15577,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650598427.140, "dur": 13.199, "args": { "External id": 15578,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650598441.867, "dur": 22.644, "args": { "External id": 15579,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650598444.106, "dur": 2.048, "args": { "External id": 15580,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598449.805, "dur": 0.722, "args": { "External id": 15581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650598465.930, "dur": 13.456, "args": { "External id": 15582,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650598480.517, "dur": 13.765, "args": { "External id": 15583,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650598502.560, "dur": 1.948, "args": { "External id": 15584,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598513.481, "dur": 3.153, "args": { "External id": 15585,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598515.597, "dur": 0.338, "args": { "External id": 15586,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650598579.055, "dur": 53.251, "args": { "External id": 15587,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598637.224, "dur": 6.580, "args": { "External id": 15588,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598641.855, "dur": 0.859, "args": { "External id": 15589,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650598645.368, "dur": 22.940, "args": { "External id": 15590,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650598672.826, "dur": 5.179, "args": { "External id": 15591,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650598674.123, "dur": 3.316, "args": { "External id": 15592,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598675.999, "dur": 1.251, "args": { "External id": 15593,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650598680.409, "dur": 41.414, "args": { "External id": 15594,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650598681.416, "dur": 39.900, "args": { "External id": 15595,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650598728.660, "dur": 15.932, "args": { "External id": 15596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650598749.659, "dur": 27.272, "args": { "External id": 15597,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650598752.402, "dur": 24.094, "args": { "External id": 15598,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598757.542, "dur": 2.502, "args": { "External id": 15599,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650598782.884, "dur": 28.749, "args": { "External id": 15600,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650598784.531, "dur": 26.892, "args": { "External id": 15601,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598789.063, "dur": 4.093, "args": { "External id": 15602,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650598794.352, "dur": 16.632, "args": { "External id": 15603,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650598824.097, "dur": 7.965, "args": { "External id": 15604,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9099 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650598828.637, "dur": 3.163, "args": { "External id": 15605,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650598833.144, "dur": 1.320, "args": { "External id": 15606,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9101 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650598833.877, "dur": 0.499, "args": { "External id": 15607,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650598873.609, "dur": 21.684, "args": { "External id": 15608,"Sequence number": 246745, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9103 } }, { "ph": "s", "id": 23, "pid": 1336754, "tid": 1336754, "ts": 1295650598873.609, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598901.018, "dur": 5.814, "args": { "External id": 15609,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598904.468, "dur": 0.982, "args": { "External id": 15610,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650598909.628, "dur": 8.227, "args": { "External id": 15611,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "1"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598915.847, "dur": 0.803, "args": { "External id": 15612,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598919.090, "dur": 3.173, "args": { "External id": 15613,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598920.778, "dur": 0.915, "args": { "External id": 15614,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "2"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598926.585, "dur": 5.857, "args": { "External id": 15615,"Sequence number": 246746, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9110 } }, { "ph": "s", "id": 22, "pid": 1336754, "tid": 1336754, "ts": 1295650598926.585, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598930.060, "dur": 0.932, "args": { "External id": 15616,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598935.925, "dur": 5.308, "args": { "External id": 15617,"Sequence number": 246747, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9112 } }, { "ph": "s", "id": 21, "pid": 1336754, "tid": 1336754, "ts": 1295650598935.925, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598939.668, "dur": 0.804, "args": { "External id": 15618,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650598942.131, "dur": 5.306, "args": { "External id": 15619,"Sequence number": 246748, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9114 } }, { "ph": "s", "id": 20, "pid": 1336754, "tid": 1336754, "ts": 1295650598942.131, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598945.533, "dur": 1.108, "args": { "External id": 15620,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650598948.572, "dur": 4.477, "args": { "External id": 15621,"Sequence number": 246749, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9116 } }, { "ph": "s", "id": 19, "pid": 1336754, "tid": 1336754, "ts": 1295650598948.572, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650598951.489, "dur": 0.876, "args": { "External id": 15622,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "2048"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650598957.260, "dur": 75.847, "args": { "External id": 15623,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650598961.043, "dur": 71.810, "args": { "External id": 15624,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650598963.894, "dur": 8.188, "args": { "External id": 15625,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650598968.465, "dur": 3.084, "args": { "External id": 15626,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650598972.795, "dur": 59.262, "args": { "External id": 15627,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650599062.477, "dur": 5.354, "args": { "External id": 15628,"Sequence number": 246750, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9123 } }, { "ph": "s", "id": 18, "pid": 1336754, "tid": 1336754, "ts": 1295650599062.477, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650599070.209, "dur": 1.308, "args": { "External id": 15629,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9124 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650599105.455, "dur": 42272.230, "args": { "External id": 15630,"Sequence number": 246751, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9125 } }, { "ph": "s", "id": 17, "pid": 1336754, "tid": 1336754, "ts": 1295650599105.455, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650599120.317, "dur": 31.652, "args": { "External id": 15631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650599121.373, "dur": 30.385, "args": { "External id": 15632,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650599122.864, "dur": 7.049, "args": { "External id": 15633,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650599124.596, "dur": 4.821, "args": { "External id": 15634,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650599130.688, "dur": 20.638, "args": { "External id": 15635,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650599169.023, "dur": 28.506, "args": { "External id": 15636,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650599170.485, "dur": 5.768, "args": { "External id": 15637,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650599172.498, "dur": 3.430, "args": { "External id": 15638,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650599177.629, "dur": 19.646, "args": { "External id": 15639,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650599179.785, "dur": 17.114, "args": { "External id": 15640,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650599201.317, "dur": 22.311, "args": { "External id": 15641,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650599202.288, "dur": 7.100, "args": { "External id": 15642,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650599205.889, "dur": 3.026, "args": { "External id": 15643,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650599210.922, "dur": 12.507, "args": { "External id": 15644,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650599211.299, "dur": 11.740, "args": { "External id": 15645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650599244.460, "dur": 20.952, "args": { "External id": 15646,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650599246.301, "dur": 3.769, "args": { "External id": 15647,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650599251.105, "dur": 13.989, "args": { "External id": 15648,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650599252.182, "dur": 12.517, "args": { "External id": 15649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1336754, "ts": 1295650599271.245, "dur": 24.998, "args": { "External id": 15650,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650599301.113, "dur": 74.980, "args": { "External id": 15651,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650599324.403, "dur": 51.267, "args": { "External id": 15652,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650599329.755, "dur": 3.204, "args": { "External id": 15653,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650599334.441, "dur": 23.604, "args": { "External id": 15654,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650599336.102, "dur": 21.527, "args": { "External id": 15655,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650599338.727, "dur": 3.136, "args": { "External id": 15656,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650599342.668, "dur": 14.528, "args": { "External id": 15657,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295650599380.759, "dur": 36119.549, "args": { "External id": 15658,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295650599382.957, "dur": 36114.717, "args": { "External id": 15659,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650635516.860, "dur": 10.280, "args": { "External id": 15660,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650635523.707, "dur": 1.417, "args": { "External id": 15661,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650635532.799, "dur": 109.160, "args": { "External id": 15662,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650635534.913, "dur": 6.814, "args": { "External id": 15663,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650635537.518, "dur": 3.431, "args": { "External id": 15664,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650635539.569, "dur": 1.100, "args": { "External id": 15665,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650635543.331, "dur": 97.982, "args": { "External id": 15666,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650635545.175, "dur": 95.331, "args": { "External id": 15667,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650635647.232, "dur": 3.897, "args": { "External id": 15668,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650635649.222, "dur": 0.859, "args": { "External id": 15669,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650635658.687, "dur": 2.621, "args": { "External id": 15670,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650635670.175, "dur": 6.469, "args": { "External id": 15671,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650635672.417, "dur": 3.949, "args": { "External id": 15672,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650635810.294, "dur": 256.949, "args": { "External id": 15673,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650635815.402, "dur": 2.311, "args": { "External id": 15674,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650635819.258, "dur": 247.406, "args": { "External id": 15675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650635820.924, "dur": 0.429, "args": { "External id": 15676,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650635822.982, "dur": 27.344, "args": { "External id": 15677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650635852.151, "dur": 6.052, "args": { "External id": 15678,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650635857.033, "dur": 0.867, "args": { "External id": 15679,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650635859.253, "dur": 27.947, "args": { "External id": 15680,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650635860.651, "dur": 1.679, "args": { "External id": 15681,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650635863.933, "dur": 22.929, "args": { "External id": 15682,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650635869.937, "dur": 3.525, "args": { "External id": 15683,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650635888.829, "dur": 26.095, "args": { "External id": 15684,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650635916.986, "dur": 18.451, "args": { "External id": 15685,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650635938.292, "dur": 17.404, "args": { "External id": 15686,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650635957.297, "dur": 14.730, "args": { "External id": 15687,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650635973.951, "dur": 58.155, "args": { "External id": 15688,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650635975.970, "dur": 1.522, "args": { "External id": 15689,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650635980.017, "dur": 1.179, "args": { "External id": 15690,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650636036.607, "dur": 13.887, "args": { "External id": 15691,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650636052.169, "dur": 13.284, "args": { "External id": 15692,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650636075.472, "dur": 2.746, "args": { "External id": 15693,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636085.320, "dur": 4.664, "args": { "External id": 15694,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636088.376, "dur": 0.807, "args": { "External id": 15695,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650636168.208, "dur": 87.753, "args": { "External id": 15696,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636263.081, "dur": 9.275, "args": { "External id": 15697,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636268.441, "dur": 1.064, "args": { "External id": 15698,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650636274.040, "dur": 31.645, "args": { "External id": 15699,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650636311.905, "dur": 6.773, "args": { "External id": 15700,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650636313.817, "dur": 4.168, "args": { "External id": 15701,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636316.150, "dur": 1.589, "args": { "External id": 15702,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650636322.336, "dur": 50.187, "args": { "External id": 15703,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650636323.834, "dur": 48.188, "args": { "External id": 15704,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650636379.008, "dur": 18.086, "args": { "External id": 15705,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636403.218, "dur": 3.322, "args": { "External id": 15706,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636405.106, "dur": 0.632, "args": { "External id": 15707,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650636411.119, "dur": 57.176, "args": { "External id": 15708,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650636412.025, "dur": 5.783, "args": { "External id": 15709,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650636412.620, "dur": 4.660, "args": { "External id": 15710,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636416.506, "dur": 0.635, "args": { "External id": 15711,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650636418.638, "dur": 49.171, "args": { "External id": 15712,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650636423.744, "dur": 43.559, "args": { "External id": 15713,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636471.927, "dur": 3.990, "args": { "External id": 15714,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636473.684, "dur": 1.139, "args": { "External id": 15715,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650636482.726, "dur": 1.723, "args": { "External id": 15716,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650636494.710, "dur": 9.314, "args": { "External id": 15717,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650636497.036, "dur": 6.656, "args": { "External id": 15718,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650636599.510, "dur": 199.519, "args": { "External id": 15719,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650636601.882, "dur": 2.442, "args": { "External id": 15720,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650636605.639, "dur": 192.885, "args": { "External id": 15721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650636607.346, "dur": 0.330, "args": { "External id": 15722,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650636609.068, "dur": 26.299, "args": { "External id": 15723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650636641.764, "dur": 3.669, "args": { "External id": 15724,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636643.909, "dur": 1.249, "args": { "External id": 15725,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650636646.198, "dur": 26.305, "args": { "External id": 15726,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650636648.142, "dur": 3.718, "args": { "External id": 15727,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650636653.534, "dur": 18.730, "args": { "External id": 15728,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650636656.140, "dur": 3.693, "args": { "External id": 15729,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650636674.103, "dur": 21.605, "args": { "External id": 15730,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650636697.061, "dur": 15.543, "args": { "External id": 15731,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650636715.722, "dur": 14.810, "args": { "External id": 15732,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650636731.992, "dur": 14.188, "args": { "External id": 15733,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650636750.087, "dur": 20.333, "args": { "External id": 15734,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650636752.207, "dur": 1.626, "args": { "External id": 15735,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636755.866, "dur": 0.573, "args": { "External id": 15736,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650636771.871, "dur": 13.721, "args": { "External id": 15737,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650636786.576, "dur": 10.875, "args": { "External id": 15738,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650636805.774, "dur": 1.959, "args": { "External id": 15739,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636816.416, "dur": 3.214, "args": { "External id": 15740,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636818.436, "dur": 0.386, "args": { "External id": 15741,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650636889.605, "dur": 53.120, "args": { "External id": 15742,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650636947.030, "dur": 4.485, "args": { "External id": 15743,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650636949.723, "dur": 0.789, "args": { "External id": 15744,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650636952.695, "dur": 23.172, "args": { "External id": 15745,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650637017.852, "dur": 11.579, "args": { "External id": 15746,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650637020.221, "dur": 8.230, "args": { "External id": 15747,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637024.645, "dur": 3.306, "args": { "External id": 15748,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650637032.789, "dur": 51.312, "args": { "External id": 15749,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650637034.294, "dur": 49.167, "args": { "External id": 15750,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650637088.441, "dur": 17.005, "args": { "External id": 15751,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637111.904, "dur": 4.111, "args": { "External id": 15752,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637114.347, "dur": 0.758, "args": { "External id": 15753,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650637120.175, "dur": 50.525, "args": { "External id": 15754,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650637123.286, "dur": 3.641, "args": { "External id": 15755,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650637124.106, "dur": 2.280, "args": { "External id": 15756,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637125.420, "dur": 0.804, "args": { "External id": 15757,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650637127.744, "dur": 42.479, "args": { "External id": 15758,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650637128.197, "dur": 41.506, "args": { "External id": 15759,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637174.796, "dur": 3.755, "args": { "External id": 15760,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637176.843, "dur": 0.694, "args": { "External id": 15761,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650637184.378, "dur": 1.795, "args": { "External id": 15762,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637195.987, "dur": 6.334, "args": { "External id": 15763,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637198.271, "dur": 3.756, "args": { "External id": 15764,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650637311.737, "dur": 232.515, "args": { "External id": 15765,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637313.877, "dur": 2.870, "args": { "External id": 15766,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650637320.861, "dur": 222.977, "args": { "External id": 15767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650637322.214, "dur": 0.280, "args": { "External id": 15768,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650637323.521, "dur": 23.612, "args": { "External id": 15769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650637351.781, "dur": 4.905, "args": { "External id": 15770,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637353.670, "dur": 2.683, "args": { "External id": 15771,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650637357.898, "dur": 23.441, "args": { "External id": 15772,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637359.472, "dur": 1.987, "args": { "External id": 15773,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650637362.773, "dur": 18.331, "args": { "External id": 15774,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650637365.425, "dur": 2.754, "args": { "External id": 15775,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650637382.891, "dur": 22.718, "args": { "External id": 15776,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650637406.903, "dur": 13.705, "args": { "External id": 15777,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650637422.932, "dur": 16.039, "args": { "External id": 15778,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650637440.321, "dur": 13.312, "args": { "External id": 15779,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650637457.562, "dur": 23.802, "args": { "External id": 15780,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650637459.238, "dur": 1.696, "args": { "External id": 15781,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637463.276, "dur": 0.862, "args": { "External id": 15782,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650637482.565, "dur": 21.135, "args": { "External id": 15783,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650637504.910, "dur": 37.803, "args": { "External id": 15784,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650637550.747, "dur": 2.217, "args": { "External id": 15785,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637564.208, "dur": 3.990, "args": { "External id": 15786,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637566.632, "dur": 0.833, "args": { "External id": 15787,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650637633.232, "dur": 70.125, "args": { "External id": 15788,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637707.802, "dur": 6.572, "args": { "External id": 15789,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637710.237, "dur": 3.072, "args": { "External id": 15790,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650637715.532, "dur": 24.567, "args": { "External id": 15791,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650637745.308, "dur": 7.154, "args": { "External id": 15792,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650637746.627, "dur": 5.213, "args": { "External id": 15793,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637750.629, "dur": 0.975, "args": { "External id": 15794,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650637754.950, "dur": 41.650, "args": { "External id": 15795,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650637756.070, "dur": 40.024, "args": { "External id": 15796,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650637800.278, "dur": 16.243, "args": { "External id": 15797,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637821.793, "dur": 3.788, "args": { "External id": 15798,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637823.892, "dur": 0.869, "args": { "External id": 15799,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650637831.371, "dur": 48.131, "args": { "External id": 15800,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650637832.447, "dur": 4.028, "args": { "External id": 15801,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650637833.466, "dur": 2.533, "args": { "External id": 15802,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637835.150, "dur": 0.692, "args": { "External id": 15803,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650637837.225, "dur": 41.906, "args": { "External id": 15804,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650637837.740, "dur": 40.979, "args": { "External id": 15805,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650637885.005, "dur": 3.618, "args": { "External id": 15806,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650637886.860, "dur": 0.754, "args": { "External id": 15807,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650637893.907, "dur": 1.469, "args": { "External id": 15808,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637902.115, "dur": 6.242, "args": { "External id": 15809,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650637904.071, "dur": 4.053, "args": { "External id": 15810,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650638032.051, "dur": 216.462, "args": { "External id": 15811,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638034.692, "dur": 6.416, "args": { "External id": 15812,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650638042.815, "dur": 205.043, "args": { "External id": 15813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650638044.080, "dur": 0.314, "args": { "External id": 15814,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650638045.720, "dur": 24.564, "args": { "External id": 15815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650638071.892, "dur": 6.330, "args": { "External id": 15816,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638076.729, "dur": 1.150, "args": { "External id": 15817,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650638079.224, "dur": 24.884, "args": { "External id": 15818,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638080.264, "dur": 1.551, "args": { "External id": 15819,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650638082.931, "dur": 20.906, "args": { "External id": 15820,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650638087.913, "dur": 3.324, "args": { "External id": 15821,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650638105.379, "dur": 22.208, "args": { "External id": 15822,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650638128.975, "dur": 14.967, "args": { "External id": 15823,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650638147.196, "dur": 15.024, "args": { "External id": 15824,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650638163.507, "dur": 13.758, "args": { "External id": 15825,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650638178.624, "dur": 22.960, "args": { "External id": 15826,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650638180.601, "dur": 1.871, "args": { "External id": 15827,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638184.263, "dur": 2.957, "args": { "External id": 15828,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650638205.094, "dur": 13.643, "args": { "External id": 15829,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650638219.693, "dur": 26.000, "args": { "External id": 15830,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650638257.315, "dur": 2.647, "args": { "External id": 15831,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650638270.544, "dur": 3.994, "args": { "External id": 15832,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638272.991, "dur": 0.733, "args": { "External id": 15833,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650638349.929, "dur": 64.749, "args": { "External id": 15834,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650638419.103, "dur": 4.611, "args": { "External id": 15835,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638421.766, "dur": 0.846, "args": { "External id": 15836,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650638427.588, "dur": 25.919, "args": { "External id": 15837,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650638458.123, "dur": 6.564, "args": { "External id": 15838,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650638459.798, "dur": 4.233, "args": { "External id": 15839,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638462.345, "dur": 1.492, "args": { "External id": 15840,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650638467.438, "dur": 44.423, "args": { "External id": 15841,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650638468.841, "dur": 42.473, "args": { "External id": 15842,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650638515.785, "dur": 16.313, "args": { "External id": 15843,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650638539.864, "dur": 4.097, "args": { "External id": 15844,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638542.392, "dur": 0.715, "args": { "External id": 15845,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650638547.895, "dur": 50.749, "args": { "External id": 15846,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650638549.007, "dur": 3.721, "args": { "External id": 15847,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650638549.868, "dur": 2.370, "args": { "External id": 15848,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638551.331, "dur": 0.730, "args": { "External id": 15849,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650638555.534, "dur": 42.648, "args": { "External id": 15850,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650638555.970, "dur": 41.700, "args": { "External id": 15851,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650638602.460, "dur": 4.082, "args": { "External id": 15852,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638604.644, "dur": 0.818, "args": { "External id": 15853,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650638613.100, "dur": 1.608, "args": { "External id": 15854,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638623.056, "dur": 5.907, "args": { "External id": 15855,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638624.829, "dur": 3.871, "args": { "External id": 15856,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650638712.656, "dur": 229.316, "args": { "External id": 15857,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638716.821, "dur": 2.313, "args": { "External id": 15858,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650638721.003, "dur": 220.515, "args": { "External id": 15859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650638722.643, "dur": 0.265, "args": { "External id": 15860,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650638723.861, "dur": 21.230, "args": { "External id": 15861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650638746.686, "dur": 5.245, "args": { "External id": 15862,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638750.753, "dur": 0.838, "args": { "External id": 15863,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650638752.635, "dur": 24.300, "args": { "External id": 15864,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650638753.867, "dur": 1.509, "args": { "External id": 15865,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650638756.371, "dur": 20.310, "args": { "External id": 15866,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650638760.582, "dur": 2.973, "args": { "External id": 15867,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650638778.352, "dur": 20.554, "args": { "External id": 15868,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650638800.244, "dur": 16.913, "args": { "External id": 15869,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650638819.795, "dur": 15.018, "args": { "External id": 15870,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650638835.876, "dur": 13.280, "args": { "External id": 15871,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650638850.576, "dur": 62.697, "args": { "External id": 15872,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650638891.971, "dur": 2.222, "args": { "External id": 15873,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638898.300, "dur": 0.732, "args": { "External id": 15874,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650638914.618, "dur": 12.992, "args": { "External id": 15875,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650638928.584, "dur": 12.062, "args": { "External id": 15876,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650638947.995, "dur": 1.840, "args": { "External id": 15877,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650638958.482, "dur": 3.317, "args": { "External id": 15878,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650638960.571, "dur": 0.454, "args": { "External id": 15879,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639069.980, "dur": 62.490, "args": { "External id": 15880,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639137.953, "dur": 7.825, "args": { "External id": 15881,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639143.238, "dur": 0.989, "args": { "External id": 15882,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650639147.140, "dur": 27.280, "args": { "External id": 15883,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650639179.969, "dur": 7.798, "args": { "External id": 15884,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650639181.756, "dur": 5.262, "args": { "External id": 15885,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639183.776, "dur": 2.949, "args": { "External id": 15886,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650639190.762, "dur": 63.104, "args": { "External id": 15887,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639193.883, "dur": 59.142, "args": { "External id": 15888,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650639259.358, "dur": 19.114, "args": { "External id": 15889,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639284.267, "dur": 5.063, "args": { "External id": 15890,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639287.158, "dur": 1.107, "args": { "External id": 15891,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650639293.470, "dur": 55.373, "args": { "External id": 15892,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650639294.364, "dur": 6.512, "args": { "External id": 15893,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650639295.276, "dur": 4.944, "args": { "External id": 15894,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639299.038, "dur": 0.839, "args": { "External id": 15895,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650639301.508, "dur": 46.929, "args": { "External id": 15896,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639302.436, "dur": 45.524, "args": { "External id": 15897,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639352.692, "dur": 4.188, "args": { "External id": 15898,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639354.812, "dur": 1.001, "args": { "External id": 15899,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650639363.099, "dur": 1.746, "args": { "External id": 15900,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639375.159, "dur": 7.089, "args": { "External id": 15901,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639376.968, "dur": 5.010, "args": { "External id": 15902,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650639466.391, "dur": 191.112, "args": { "External id": 15903,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639468.719, "dur": 2.323, "args": { "External id": 15904,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650639474.933, "dur": 182.117, "args": { "External id": 15905,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650639476.249, "dur": 0.504, "args": { "External id": 15906,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650639479.999, "dur": 22.605, "args": { "External id": 15907,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650639504.312, "dur": 4.973, "args": { "External id": 15908,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639506.131, "dur": 2.914, "args": { "External id": 15909,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650639510.129, "dur": 22.381, "args": { "External id": 15910,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639511.377, "dur": 1.794, "args": { "External id": 15911,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650639514.471, "dur": 17.816, "args": { "External id": 15912,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650639516.804, "dur": 3.038, "args": { "External id": 15913,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650639533.883, "dur": 21.232, "args": { "External id": 15914,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650639556.506, "dur": 15.294, "args": { "External id": 15915,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650639574.852, "dur": 14.139, "args": { "External id": 15916,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650639592.459, "dur": 13.600, "args": { "External id": 15917,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650639607.468, "dur": 22.286, "args": { "External id": 15918,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650639609.457, "dur": 1.726, "args": { "External id": 15919,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639612.878, "dur": 2.785, "args": { "External id": 15920,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650639631.123, "dur": 12.803, "args": { "External id": 15921,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650639644.954, "dur": 10.978, "args": { "External id": 15922,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650639666.054, "dur": 1.715, "args": { "External id": 15923,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639676.148, "dur": 3.188, "args": { "External id": 15924,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639678.328, "dur": 0.281, "args": { "External id": 15925,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639740.425, "dur": 50.869, "args": { "External id": 15926,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639795.659, "dur": 4.664, "args": { "External id": 15927,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639798.336, "dur": 0.853, "args": { "External id": 15928,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650639801.604, "dur": 23.382, "args": { "External id": 15929,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650639829.480, "dur": 7.626, "args": { "External id": 15930,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650639831.162, "dur": 5.345, "args": { "External id": 15931,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639834.819, "dur": 1.445, "args": { "External id": 15932,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650639839.576, "dur": 39.932, "args": { "External id": 15933,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639840.604, "dur": 38.282, "args": { "External id": 15934,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650639883.090, "dur": 14.982, "args": { "External id": 15935,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639903.181, "dur": 4.047, "args": { "External id": 15936,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639905.599, "dur": 0.816, "args": { "External id": 15937,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650639913.037, "dur": 46.093, "args": { "External id": 15938,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650639913.746, "dur": 3.534, "args": { "External id": 15939,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650639914.541, "dur": 2.288, "args": { "External id": 15940,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639915.924, "dur": 0.751, "args": { "External id": 15941,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650639918.069, "dur": 40.750, "args": { "External id": 15942,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650639918.961, "dur": 39.158, "args": { "External id": 15943,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650639962.871, "dur": 3.960, "args": { "External id": 15944,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650639965.093, "dur": 0.767, "args": { "External id": 15945,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650639973.888, "dur": 1.475, "args": { "External id": 15946,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639982.267, "dur": 42.309, "args": { "External id": 15947,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650639983.938, "dur": 39.941, "args": { "External id": 15948,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650640112.862, "dur": 221.404, "args": { "External id": 15949,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640117.546, "dur": 2.305, "args": { "External id": 15950,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650640121.779, "dur": 211.922, "args": { "External id": 15951,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650640125.163, "dur": 0.270, "args": { "External id": 15952,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650640126.606, "dur": 21.928, "args": { "External id": 15953,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650640150.089, "dur": 5.499, "args": { "External id": 15954,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640154.178, "dur": 1.121, "args": { "External id": 15955,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650640163.927, "dur": 22.481, "args": { "External id": 15956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640165.333, "dur": 1.484, "args": { "External id": 15957,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650640167.824, "dur": 18.361, "args": { "External id": 15958,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650640170.419, "dur": 3.329, "args": { "External id": 15959,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650640187.910, "dur": 22.079, "args": { "External id": 15960,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650640211.230, "dur": 14.312, "args": { "External id": 15961,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650640241.383, "dur": 18.477, "args": { "External id": 15962,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650640263.326, "dur": 13.411, "args": { "External id": 15963,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650640278.618, "dur": 24.413, "args": { "External id": 15964,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650640283.032, "dur": 1.792, "args": { "External id": 15965,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640286.903, "dur": 1.107, "args": { "External id": 15966,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650640304.430, "dur": 13.045, "args": { "External id": 15967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650640318.644, "dur": 11.866, "args": { "External id": 15968,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650640341.377, "dur": 2.375, "args": { "External id": 15969,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650640352.323, "dur": 4.020, "args": { "External id": 15970,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640354.968, "dur": 0.510, "args": { "External id": 15971,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650640419.854, "dur": 56.656, "args": { "External id": 15972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650640481.196, "dur": 4.886, "args": { "External id": 15973,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640483.943, "dur": 1.246, "args": { "External id": 15974,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650640492.326, "dur": 23.029, "args": { "External id": 15975,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650640521.708, "dur": 7.674, "args": { "External id": 15976,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650640523.130, "dur": 5.615, "args": { "External id": 15977,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640525.277, "dur": 3.278, "args": { "External id": 15978,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650640531.913, "dur": 41.650, "args": { "External id": 15979,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650640533.435, "dur": 39.550, "args": { "External id": 15980,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650640577.244, "dur": 15.116, "args": { "External id": 15981,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650640597.374, "dur": 5.612, "args": { "External id": 15982,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640601.339, "dur": 0.697, "args": { "External id": 15983,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650640607.050, "dur": 49.951, "args": { "External id": 15984,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650640607.681, "dur": 4.157, "args": { "External id": 15985,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650640608.554, "dur": 2.568, "args": { "External id": 15986,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640610.415, "dur": 0.587, "args": { "External id": 15987,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650640612.599, "dur": 43.979, "args": { "External id": 15988,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650640615.418, "dur": 40.565, "args": { "External id": 15989,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650640660.532, "dur": 3.442, "args": { "External id": 15990,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640662.238, "dur": 0.742, "args": { "External id": 15991,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650640669.071, "dur": 1.442, "args": { "External id": 15992,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640677.606, "dur": 8.506, "args": { "External id": 15993,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640681.265, "dur": 4.609, "args": { "External id": 15994,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650640764.790, "dur": 180.744, "args": { "External id": 15995,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640767.039, "dur": 2.109, "args": { "External id": 15996,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650640773.352, "dur": 171.696, "args": { "External id": 15997,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650640774.543, "dur": 0.292, "args": { "External id": 15998,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650640776.435, "dur": 20.917, "args": { "External id": 15999,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650640798.706, "dur": 5.865, "args": { "External id": 16000,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640800.838, "dur": 3.386, "args": { "External id": 16001,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650640805.312, "dur": 23.071, "args": { "External id": 16002,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650640808.205, "dur": 1.716, "args": { "External id": 16003,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650640811.104, "dur": 17.043, "args": { "External id": 16004,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650640813.404, "dur": 2.360, "args": { "External id": 16005,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650640829.735, "dur": 19.032, "args": { "External id": 16006,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650640850.085, "dur": 14.053, "args": { "External id": 16007,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650640866.479, "dur": 14.221, "args": { "External id": 16008,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650640881.814, "dur": 12.033, "args": { "External id": 16009,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650640895.383, "dur": 22.456, "args": { "External id": 16010,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650640897.265, "dur": 2.252, "args": { "External id": 16011,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640903.416, "dur": 0.581, "args": { "External id": 16012,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650640919.253, "dur": 13.029, "args": { "External id": 16013,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650640933.203, "dur": 10.723, "args": { "External id": 16014,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650640951.429, "dur": 1.630, "args": { "External id": 16015,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650640961.022, "dur": 3.169, "args": { "External id": 16016,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650640963.094, "dur": 0.317, "args": { "External id": 16017,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650641070.003, "dur": 58.989, "args": { "External id": 16018,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641134.023, "dur": 9.458, "args": { "External id": 16019,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641138.905, "dur": 2.959, "args": { "External id": 16020,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650641145.105, "dur": 24.977, "args": { "External id": 16021,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650641174.910, "dur": 4.817, "args": { "External id": 16022,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650641176.203, "dur": 3.016, "args": { "External id": 16023,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641177.988, "dur": 1.016, "args": { "External id": 16024,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650641182.327, "dur": 44.374, "args": { "External id": 16025,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650641185.471, "dur": 40.630, "args": { "External id": 16026,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650641245.721, "dur": 19.550, "args": { "External id": 16027,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650641270.889, "dur": 26.447, "args": { "External id": 16028,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650641273.885, "dur": 23.087, "args": { "External id": 16029,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641279.456, "dur": 1.081, "args": { "External id": 16030,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650641303.000, "dur": 29.076, "args": { "External id": 16031,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650641305.015, "dur": 26.861, "args": { "External id": 16032,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641309.709, "dur": 4.506, "args": { "External id": 16033,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650641315.450, "dur": 15.907, "args": { "External id": 16034,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650641344.825, "dur": 6.765, "args": { "External id": 16035,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9530 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650641348.416, "dur": 2.899, "args": { "External id": 16036,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650641352.880, "dur": 1.274, "args": { "External id": 16037,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9532 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650641353.401, "dur": 0.627, "args": { "External id": 16038,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650641392.447, "dur": 21.055, "args": { "External id": 16039,"Sequence number": 246752, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650641415.427, "dur": 15.218, "args": { "External id": 16040,"Sequence number": 246753, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9535 } }, { "ph": "s", "id": 16, "pid": 1336754, "tid": 1336754, "ts": 1295650641415.427, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641436.836, "dur": 5.852, "args": { "External id": 16041,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641440.344, "dur": 1.112, "args": { "External id": 16042,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650641447.561, "dur": 6.701, "args": { "External id": 16043,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "2"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641452.035, "dur": 0.884, "args": { "External id": 16044,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641455.575, "dur": 3.013, "args": { "External id": 16045,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641457.232, "dur": 0.682, "args": { "External id": 16046,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "3"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641462.456, "dur": 8.404, "args": { "External id": 16047,"Sequence number": 246754, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9542 } }, { "ph": "s", "id": 15, "pid": 1336754, "tid": 1336754, "ts": 1295650641462.456, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641468.213, "dur": 1.319, "args": { "External id": 16048,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641471.733, "dur": 5.221, "args": { "External id": 16049,"Sequence number": 246755, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9544 } }, { "ph": "s", "id": 14, "pid": 1336754, "tid": 1336754, "ts": 1295650641471.733, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641475.404, "dur": 0.728, "args": { "External id": 16050,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650641478.081, "dur": 8.242, "args": { "External id": 16051,"Sequence number": 246756, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "2"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9546 } }, { "ph": "s", "id": 13, "pid": 1336754, "tid": 1336754, "ts": 1295650641478.081, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641484.355, "dur": 1.088, "args": { "External id": 16052,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650641487.503, "dur": 6.020, "args": { "External id": 16053,"Sequence number": 246757, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9548 } }, { "ph": "s", "id": 12, "pid": 1336754, "tid": 1336754, "ts": 1295650641487.503, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641491.600, "dur": 1.190, "args": { "External id": 16054,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "4096"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650641497.636, "dur": 29.379, "args": { "External id": 16055,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650641499.349, "dur": 27.466, "args": { "External id": 16056,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641501.719, "dur": 6.024, "args": { "External id": 16057,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650641504.016, "dur": 3.155, "args": { "External id": 16058,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650641508.917, "dur": 17.477, "args": { "External id": 16059,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650641553.957, "dur": 3.878, "args": { "External id": 16060,"Sequence number": 246758, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9555 } }, { "ph": "s", "id": 11, "pid": 1336754, "tid": 1336754, "ts": 1295650641553.957, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650641560.041, "dur": 3.256, "args": { "External id": 16061,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9556 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650641597.753, "dur": 43169.133, "args": { "External id": 16062,"Sequence number": 246759, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9557 } }, { "ph": "s", "id": 10, "pid": 1336754, "tid": 1336754, "ts": 1295650641597.753, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650641615.279, "dur": 25.923, "args": { "External id": 16063,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650641616.272, "dur": 24.687, "args": { "External id": 16064,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641617.577, "dur": 5.147, "args": { "External id": 16065,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650641619.136, "dur": 3.283, "args": { "External id": 16066,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650641623.287, "dur": 17.253, "args": { "External id": 16067,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641656.094, "dur": 25.647, "args": { "External id": 16068,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641657.670, "dur": 5.424, "args": { "External id": 16069,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641659.406, "dur": 3.422, "args": { "External id": 16070,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650641664.477, "dur": 16.986, "args": { "External id": 16071,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650641666.203, "dur": 14.725, "args": { "External id": 16072,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641685.170, "dur": 22.461, "args": { "External id": 16073,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650641686.003, "dur": 6.990, "args": { "External id": 16074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641689.754, "dur": 3.027, "args": { "External id": 16075,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650641693.736, "dur": 13.657, "args": { "External id": 16076,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650641694.579, "dur": 12.482, "args": { "External id": 16077,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 9572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650641713.255, "dur": 20.975, "args": { "External id": 16078,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 9573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650641715.081, "dur": 4.883, "args": { "External id": 16079,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650641720.612, "dur": 13.340, "args": { "External id": 16080,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 9575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650641721.579, "dur": 11.911, "args": { "External id": 16081,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1336754, "ts": 1295650641740.910, "dur": 21.025, "args": { "External id": 16082,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650641764.481, "dur": 49.846, "args": { "External id": 16083,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650641766.634, "dur": 47.187, "args": { "External id": 16084,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641771.316, "dur": 0.889, "args": { "External id": 16085,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650641773.463, "dur": 24.715, "args": { "External id": 16086,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650641774.770, "dur": 23.188, "args": { "External id": 16087,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 9582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650641779.250, "dur": 2.967, "args": { "External id": 16088,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650641783.081, "dur": 14.593, "args": { "External id": 16089,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 9584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295650641818.280, "dur": 37219.258, "args": { "External id": 16090,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295650641819.852, "dur": 37216.396, "args": { "External id": 16091,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 9586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679049.635, "dur": 8.914, "args": { "External id": 16092,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679055.967, "dur": 1.107, "args": { "External id": 16093,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650679063.795, "dur": 104.396, "args": { "External id": 16094,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650679065.243, "dur": 6.019, "args": { "External id": 16095,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650679067.371, "dur": 3.099, "args": { "External id": 16096,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679069.097, "dur": 1.089, "args": { "External id": 16097,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650679072.488, "dur": 95.118, "args": { "External id": 16098,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650679076.488, "dur": 90.213, "args": { "External id": 16099,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679171.708, "dur": 4.389, "args": { "External id": 16100,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679173.797, "dur": 0.806, "args": { "External id": 16101,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650679183.225, "dur": 2.397, "args": { "External id": 16102,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679194.778, "dur": 6.650, "args": { "External id": 16103,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679197.167, "dur": 3.966, "args": { "External id": 16104,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650679339.726, "dur": 211.726, "args": { "External id": 16105,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679342.963, "dur": 3.388, "args": { "External id": 16106,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650679348.586, "dur": 202.472, "args": { "External id": 16107,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650679352.834, "dur": 0.396, "args": { "External id": 16108,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650679354.846, "dur": 27.198, "args": { "External id": 16109,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650679384.006, "dur": 4.197, "args": { "External id": 16110,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679386.721, "dur": 1.030, "args": { "External id": 16111,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650679389.397, "dur": 31.725, "args": { "External id": 16112,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679393.455, "dur": 1.870, "args": { "External id": 16113,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650679399.413, "dur": 21.463, "args": { "External id": 16114,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650679403.325, "dur": 3.336, "args": { "External id": 16115,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650679422.560, "dur": 22.441, "args": { "External id": 16116,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650679446.554, "dur": 15.933, "args": { "External id": 16117,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650679465.272, "dur": 16.427, "args": { "External id": 16118,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650679483.145, "dur": 13.647, "args": { "External id": 16119,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650679498.924, "dur": 23.829, "args": { "External id": 16120,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650679500.411, "dur": 1.952, "args": { "External id": 16121,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679506.961, "dur": 1.076, "args": { "External id": 16122,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650679524.123, "dur": 13.097, "args": { "External id": 16123,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650679538.446, "dur": 11.693, "args": { "External id": 16124,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650679558.136, "dur": 1.912, "args": { "External id": 16125,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679566.348, "dur": 4.514, "args": { "External id": 16126,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679569.155, "dur": 0.699, "args": { "External id": 16127,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650679640.468, "dur": 66.125, "args": { "External id": 16128,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679712.259, "dur": 9.948, "args": { "External id": 16129,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679716.725, "dur": 3.276, "args": { "External id": 16130,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650679723.552, "dur": 24.881, "args": { "External id": 16131,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650679753.527, "dur": 6.513, "args": { "External id": 16132,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650679755.459, "dur": 3.899, "args": { "External id": 16133,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679757.888, "dur": 0.928, "args": { "External id": 16134,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650679763.069, "dur": 47.148, "args": { "External id": 16135,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650679766.836, "dur": 42.704, "args": { "External id": 16136,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650679814.321, "dur": 16.854, "args": { "External id": 16137,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679837.472, "dur": 3.798, "args": { "External id": 16138,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679839.345, "dur": 0.947, "args": { "External id": 16139,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650679845.506, "dur": 51.492, "args": { "External id": 16140,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650679846.849, "dur": 6.262, "args": { "External id": 16141,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650679847.733, "dur": 4.807, "args": { "External id": 16142,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679851.478, "dur": 0.916, "args": { "External id": 16143,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650679853.970, "dur": 42.730, "args": { "External id": 16144,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650679854.776, "dur": 41.242, "args": { "External id": 16145,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650679900.980, "dur": 3.698, "args": { "External id": 16146,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650679902.833, "dur": 0.723, "args": { "External id": 16147,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650679910.275, "dur": 1.519, "args": { "External id": 16148,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679921.251, "dur": 6.390, "args": { "External id": 16149,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650679923.564, "dur": 3.819, "args": { "External id": 16150,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650680056.214, "dur": 221.027, "args": { "External id": 16151,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680058.715, "dur": 5.592, "args": { "External id": 16152,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650680066.328, "dur": 210.422, "args": { "External id": 16153,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650680068.208, "dur": 0.481, "args": { "External id": 16154,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650680072.505, "dur": 25.489, "args": { "External id": 16155,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650680099.558, "dur": 6.253, "args": { "External id": 16156,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680104.422, "dur": 1.074, "args": { "External id": 16157,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650680107.010, "dur": 22.815, "args": { "External id": 16158,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680108.477, "dur": 1.713, "args": { "External id": 16159,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650680111.395, "dur": 18.209, "args": { "External id": 16160,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650680113.795, "dur": 3.346, "args": { "External id": 16161,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650680131.296, "dur": 23.091, "args": { "External id": 16162,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650680155.718, "dur": 14.060, "args": { "External id": 16163,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650680172.492, "dur": 15.907, "args": { "External id": 16164,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650680191.680, "dur": 13.344, "args": { "External id": 16165,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650680206.547, "dur": 37.382, "args": { "External id": 16166,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650680211.384, "dur": 1.608, "args": { "External id": 16167,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680214.898, "dur": 0.925, "args": { "External id": 16168,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650680246.437, "dur": 15.296, "args": { "External id": 16169,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650680262.723, "dur": 12.631, "args": { "External id": 16170,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650680287.420, "dur": 2.502, "args": { "External id": 16171,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650680299.637, "dur": 3.870, "args": { "External id": 16172,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680302.089, "dur": 0.611, "args": { "External id": 16173,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650680374.846, "dur": 60.074, "args": { "External id": 16174,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650680439.778, "dur": 4.710, "args": { "External id": 16175,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680442.645, "dur": 0.739, "args": { "External id": 16176,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650680445.841, "dur": 25.019, "args": { "External id": 16177,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650680475.305, "dur": 7.309, "args": { "External id": 16178,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650680476.727, "dur": 5.085, "args": { "External id": 16179,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680480.442, "dur": 1.133, "args": { "External id": 16180,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650680485.248, "dur": 40.748, "args": { "External id": 16181,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650680486.314, "dur": 39.081, "args": { "External id": 16182,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650680529.521, "dur": 15.193, "args": { "External id": 16183,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650680550.234, "dur": 4.025, "args": { "External id": 16184,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680552.666, "dur": 0.765, "args": { "External id": 16185,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650680560.045, "dur": 47.980, "args": { "External id": 16186,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650680561.105, "dur": 3.650, "args": { "External id": 16187,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650680561.980, "dur": 2.248, "args": { "External id": 16188,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680563.426, "dur": 0.659, "args": { "External id": 16189,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650680565.674, "dur": 42.011, "args": { "External id": 16190,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650680566.270, "dur": 40.893, "args": { "External id": 16191,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650680632.654, "dur": 4.462, "args": { "External id": 16192,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680635.076, "dur": 0.836, "args": { "External id": 16193,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650680644.899, "dur": 1.560, "args": { "External id": 16194,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680654.150, "dur": 8.533, "args": { "External id": 16195,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680656.366, "dur": 6.052, "args": { "External id": 16196,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650680745.786, "dur": 188.795, "args": { "External id": 16197,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680747.935, "dur": 2.270, "args": { "External id": 16198,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650680752.273, "dur": 181.773, "args": { "External id": 16199,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650680753.968, "dur": 0.690, "args": { "External id": 16200,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650680757.481, "dur": 26.308, "args": { "External id": 16201,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650680785.432, "dur": 3.139, "args": { "External id": 16202,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680787.348, "dur": 0.977, "args": { "External id": 16203,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650680789.485, "dur": 25.349, "args": { "External id": 16204,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650680790.939, "dur": 1.718, "args": { "External id": 16205,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650680793.871, "dur": 20.653, "args": { "External id": 16206,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650680798.564, "dur": 2.660, "args": { "External id": 16207,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650680816.404, "dur": 20.047, "args": { "External id": 16208,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650680838.158, "dur": 14.183, "args": { "External id": 16209,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650680854.888, "dur": 13.900, "args": { "External id": 16210,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650680872.442, "dur": 13.270, "args": { "External id": 16211,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650680887.139, "dur": 19.697, "args": { "External id": 16212,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650680889.126, "dur": 1.557, "args": { "External id": 16213,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680892.340, "dur": 0.745, "args": { "External id": 16214,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650680908.168, "dur": 12.412, "args": { "External id": 16215,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650680921.706, "dur": 11.469, "args": { "External id": 16216,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650680942.225, "dur": 1.571, "args": { "External id": 16217,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650680951.586, "dur": 3.658, "args": { "External id": 16218,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650680953.903, "dur": 0.546, "args": { "External id": 16219,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681061.837, "dur": 86.925, "args": { "External id": 16220,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681154.144, "dur": 5.706, "args": { "External id": 16221,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681157.079, "dur": 1.175, "args": { "External id": 16222,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650681161.240, "dur": 36.986, "args": { "External id": 16223,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650681203.247, "dur": 7.735, "args": { "External id": 16224,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650681206.799, "dur": 3.582, "args": { "External id": 16225,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681208.943, "dur": 1.198, "args": { "External id": 16226,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650681216.787, "dur": 70.753, "args": { "External id": 16227,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681218.182, "dur": 68.357, "args": { "External id": 16228,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650681293.116, "dur": 17.978, "args": { "External id": 16229,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681317.799, "dur": 6.780, "args": { "External id": 16230,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681322.557, "dur": 1.065, "args": { "External id": 16231,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650681328.701, "dur": 50.360, "args": { "External id": 16232,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650681329.551, "dur": 3.689, "args": { "External id": 16233,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650681330.477, "dur": 2.247, "args": { "External id": 16234,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681331.839, "dur": 0.740, "args": { "External id": 16235,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650681333.969, "dur": 44.624, "args": { "External id": 16236,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681334.527, "dur": 43.606, "args": { "External id": 16237,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681385.026, "dur": 6.107, "args": { "External id": 16238,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681387.280, "dur": 2.668, "args": { "External id": 16239,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650681397.458, "dur": 1.465, "args": { "External id": 16240,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650681406.504, "dur": 6.306, "args": { "External id": 16241,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650681408.441, "dur": 4.108, "args": { "External id": 16242,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650681507.111, "dur": 192.886, "args": { "External id": 16243,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650681509.572, "dur": 2.269, "args": { "External id": 16244,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650681513.497, "dur": 186.070, "args": { "External id": 16245,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650681514.681, "dur": 0.424, "args": { "External id": 16246,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650681516.085, "dur": 24.891, "args": { "External id": 16247,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650681542.331, "dur": 3.347, "args": { "External id": 16248,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681544.423, "dur": 0.978, "args": { "External id": 16249,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650681546.632, "dur": 27.392, "args": { "External id": 16250,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650681547.952, "dur": 1.893, "args": { "External id": 16251,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650681553.186, "dur": 20.454, "args": { "External id": 16252,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650681558.220, "dur": 2.743, "args": { "External id": 16253,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650681575.747, "dur": 22.257, "args": { "External id": 16254,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650681599.619, "dur": 13.875, "args": { "External id": 16255,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650681616.313, "dur": 16.337, "args": { "External id": 16256,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650681634.077, "dur": 12.900, "args": { "External id": 16257,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650681648.538, "dur": 22.994, "args": { "External id": 16258,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650681650.224, "dur": 2.363, "args": { "External id": 16259,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681656.104, "dur": 0.838, "args": { "External id": 16260,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650681672.800, "dur": 12.928, "args": { "External id": 16261,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650681686.746, "dur": 11.602, "args": { "External id": 16262,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650681706.570, "dur": 1.963, "args": { "External id": 16263,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681717.011, "dur": 3.788, "args": { "External id": 16264,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681719.345, "dur": 0.653, "args": { "External id": 16265,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681784.909, "dur": 51.596, "args": { "External id": 16266,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681841.082, "dur": 7.316, "args": { "External id": 16267,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681845.801, "dur": 1.594, "args": { "External id": 16268,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650681849.488, "dur": 24.330, "args": { "External id": 16269,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650681878.469, "dur": 4.966, "args": { "External id": 16270,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650681880.005, "dur": 2.773, "args": { "External id": 16271,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681881.888, "dur": 0.697, "args": { "External id": 16272,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650681885.923, "dur": 40.751, "args": { "External id": 16273,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681887.094, "dur": 38.906, "args": { "External id": 16274,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650681932.240, "dur": 15.011, "args": { "External id": 16275,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650681952.710, "dur": 4.067, "args": { "External id": 16276,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681955.294, "dur": 0.603, "args": { "External id": 16277,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650681960.107, "dur": 95.171, "args": { "External id": 16278,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650681960.831, "dur": 8.934, "args": { "External id": 16279,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650681961.918, "dur": 7.243, "args": { "External id": 16280,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650681968.286, "dur": 0.736, "args": { "External id": 16281,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650681970.492, "dur": 84.134, "args": { "External id": 16282,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650681971.233, "dur": 82.320, "args": { "External id": 16283,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650682070.096, "dur": 5.136, "args": { "External id": 16284,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682072.867, "dur": 1.005, "args": { "External id": 16285,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650682081.956, "dur": 1.648, "args": { "External id": 16286,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682091.183, "dur": 8.508, "args": { "External id": 16287,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682095.331, "dur": 4.076, "args": { "External id": 16288,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650682185.420, "dur": 211.120, "args": { "External id": 16289,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682189.840, "dur": 2.427, "args": { "External id": 16290,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650682193.889, "dur": 202.238, "args": { "External id": 16291,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650682194.979, "dur": 0.487, "args": { "External id": 16292,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650682196.432, "dur": 23.157, "args": { "External id": 16293,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650682221.189, "dur": 5.945, "args": { "External id": 16294,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682226.016, "dur": 0.717, "args": { "External id": 16295,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650682241.131, "dur": 28.809, "args": { "External id": 16296,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682242.730, "dur": 2.286, "args": { "External id": 16297,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650682248.922, "dur": 20.698, "args": { "External id": 16298,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650682251.754, "dur": 3.574, "args": { "External id": 16299,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650682271.110, "dur": 21.826, "args": { "External id": 16300,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650682294.425, "dur": 17.900, "args": { "External id": 16301,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650682314.673, "dur": 14.760, "args": { "External id": 16302,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650682330.763, "dur": 13.880, "args": { "External id": 16303,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650682345.991, "dur": 22.430, "args": { "External id": 16304,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650682347.983, "dur": 2.025, "args": { "External id": 16305,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682353.750, "dur": 0.769, "args": { "External id": 16306,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650682369.867, "dur": 13.530, "args": { "External id": 16307,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650682384.490, "dur": 10.674, "args": { "External id": 16308,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650682404.035, "dur": 2.085, "args": { "External id": 16309,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650682414.773, "dur": 3.476, "args": { "External id": 16310,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682417.038, "dur": 0.453, "args": { "External id": 16311,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650682484.400, "dur": 56.312, "args": { "External id": 16312,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650682544.786, "dur": 7.200, "args": { "External id": 16313,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682549.962, "dur": 0.987, "args": { "External id": 16314,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650682553.285, "dur": 25.412, "args": { "External id": 16315,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650682583.669, "dur": 5.167, "args": { "External id": 16316,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650682585.269, "dur": 2.997, "args": { "External id": 16317,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682587.043, "dur": 1.058, "args": { "External id": 16318,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650682591.578, "dur": 42.683, "args": { "External id": 16319,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650682594.696, "dur": 39.031, "args": { "External id": 16320,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650682638.028, "dur": 14.795, "args": { "External id": 16321,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650682658.572, "dur": 3.715, "args": { "External id": 16322,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682660.718, "dur": 0.719, "args": { "External id": 16323,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650682666.029, "dur": 62.564, "args": { "External id": 16324,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650682680.242, "dur": 6.119, "args": { "External id": 16325,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650682683.327, "dur": 2.543, "args": { "External id": 16326,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682685.019, "dur": 0.732, "args": { "External id": 16327,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650682687.142, "dur": 41.106, "args": { "External id": 16328,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650682687.761, "dur": 40.004, "args": { "External id": 16329,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650682732.130, "dur": 3.651, "args": { "External id": 16330,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682734.219, "dur": 0.484, "args": { "External id": 16331,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650682742.772, "dur": 1.353, "args": { "External id": 16332,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682750.816, "dur": 7.954, "args": { "External id": 16333,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682752.559, "dur": 5.920, "args": { "External id": 16334,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650682838.455, "dur": 228.013, "args": { "External id": 16335,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682840.893, "dur": 2.161, "args": { "External id": 16336,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650682844.773, "dur": 221.279, "args": { "External id": 16337,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650682848.429, "dur": 0.298, "args": { "External id": 16338,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650682849.795, "dur": 24.392, "args": { "External id": 16339,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650682875.831, "dur": 2.664, "args": { "External id": 16340,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682877.507, "dur": 0.740, "args": { "External id": 16341,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650682879.244, "dur": 23.367, "args": { "External id": 16342,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650682880.845, "dur": 1.451, "args": { "External id": 16343,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650682883.366, "dur": 18.952, "args": { "External id": 16344,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650682887.559, "dur": 2.389, "args": { "External id": 16345,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650682903.956, "dur": 19.477, "args": { "External id": 16346,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650682924.804, "dur": 12.973, "args": { "External id": 16347,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650682941.976, "dur": 15.601, "args": { "External id": 16348,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650682958.875, "dur": 13.082, "args": { "External id": 16349,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650682973.468, "dur": 58.523, "args": { "External id": 16350,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650682975.348, "dur": 1.903, "args": { "External id": 16351,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650682979.288, "dur": 0.873, "args": { "External id": 16352,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650683034.623, "dur": 13.755, "args": { "External id": 16353,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650683051.684, "dur": 12.926, "args": { "External id": 16354,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650683073.938, "dur": 2.211, "args": { "External id": 16355,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683084.623, "dur": 3.825, "args": { "External id": 16356,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683087.081, "dur": 0.651, "args": { "External id": 16357,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650683151.852, "dur": 54.143, "args": { "External id": 16358,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683210.775, "dur": 4.992, "args": { "External id": 16359,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683213.201, "dur": 1.515, "args": { "External id": 16360,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650683216.927, "dur": 42.260, "args": { "External id": 16361,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650683265.157, "dur": 8.028, "args": { "External id": 16362,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650683269.201, "dur": 3.139, "args": { "External id": 16363,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683271.377, "dur": 0.749, "args": { "External id": 16364,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650683276.096, "dur": 44.790, "args": { "External id": 16365,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650683277.332, "dur": 42.753, "args": { "External id": 16366,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650683324.275, "dur": 17.344, "args": { "External id": 16367,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683347.553, "dur": 6.179, "args": { "External id": 16368,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683351.978, "dur": 0.902, "args": { "External id": 16369,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650683357.452, "dur": 50.245, "args": { "External id": 16370,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650683358.386, "dur": 6.205, "args": { "External id": 16371,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650683359.379, "dur": 4.659, "args": { "External id": 16372,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683360.694, "dur": 2.885, "args": { "External id": 16373,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650683365.160, "dur": 42.214, "args": { "External id": 16374,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650683365.766, "dur": 41.040, "args": { "External id": 16375,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683411.463, "dur": 4.076, "args": { "External id": 16376,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683413.821, "dur": 0.594, "args": { "External id": 16377,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650683423.012, "dur": 1.426, "args": { "External id": 16378,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650683431.236, "dur": 6.619, "args": { "External id": 16379,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650683433.302, "dur": 4.292, "args": { "External id": 16380,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650683515.862, "dur": 217.767, "args": { "External id": 16381,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650683518.443, "dur": 2.099, "args": { "External id": 16382,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650683523.794, "dur": 209.395, "args": { "External id": 16383,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650683524.803, "dur": 0.267, "args": { "External id": 16384,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650683560.325, "dur": 22.825, "args": { "External id": 16385,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650683584.941, "dur": 3.032, "args": { "External id": 16386,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683586.550, "dur": 1.143, "args": { "External id": 16387,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650683588.824, "dur": 22.941, "args": { "External id": 16388,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650683589.711, "dur": 3.211, "args": { "External id": 16389,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650683593.984, "dur": 17.461, "args": { "External id": 16390,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650683596.166, "dur": 3.220, "args": { "External id": 16391,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650683612.921, "dur": 20.639, "args": { "External id": 16392,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650683634.838, "dur": 14.356, "args": { "External id": 16393,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650683653.567, "dur": 14.735, "args": { "External id": 16394,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650683669.448, "dur": 13.680, "args": { "External id": 16395,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650683684.517, "dur": 19.376, "args": { "External id": 16396,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650683686.156, "dur": 1.829, "args": { "External id": 16397,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683689.609, "dur": 0.519, "args": { "External id": 16398,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650683705.192, "dur": 13.315, "args": { "External id": 16399,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650683721.576, "dur": 10.820, "args": { "External id": 16400,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650683739.724, "dur": 1.425, "args": { "External id": 16401,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683748.680, "dur": 3.151, "args": { "External id": 16402,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683750.557, "dur": 0.543, "args": { "External id": 16403,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650683811.588, "dur": 49.083, "args": { "External id": 16404,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683865.224, "dur": 4.101, "args": { "External id": 16405,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683867.545, "dur": 0.663, "args": { "External id": 16406,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650683870.440, "dur": 23.742, "args": { "External id": 16407,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650683900.443, "dur": 6.219, "args": { "External id": 16408,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650683901.482, "dur": 4.568, "args": { "External id": 16409,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683903.043, "dur": 2.824, "args": { "External id": 16410,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650683908.723, "dur": 39.780, "args": { "External id": 16411,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650683909.503, "dur": 38.125, "args": { "External id": 16412,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650683951.555, "dur": 15.252, "args": { "External id": 16413,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650683971.660, "dur": 5.578, "args": { "External id": 16414,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683975.722, "dur": 0.734, "args": { "External id": 16415,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650683980.585, "dur": 90.361, "args": { "External id": 16416,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 9911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650683981.018, "dur": 3.027, "args": { "External id": 16417,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650683981.548, "dur": 1.829, "args": { "External id": 16418,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 9913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650683982.640, "dur": 0.598, "args": { "External id": 16419,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 9914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650684020.246, "dur": 50.106, "args": { "External id": 16420,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650684023.167, "dur": 46.455, "args": { "External id": 16421,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 9916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684075.615, "dur": 4.547, "args": { "External id": 16422,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684078.081, "dur": 0.804, "args": { "External id": 16423,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650684086.375, "dur": 1.402, "args": { "External id": 16424,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 9919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650684094.937, "dur": 8.789, "args": { "External id": 16425,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 9920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650684098.575, "dur": 4.876, "args": { "External id": 16426,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650684182.667, "dur": 222.402, "args": { "External id": 16427,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650684184.561, "dur": 2.353, "args": { "External id": 16428,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650684190.605, "dur": 214.074, "args": { "External id": 16429,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 9924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650684191.602, "dur": 0.461, "args": { "External id": 16430,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650684193.312, "dur": 22.939, "args": { "External id": 16431,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 9926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650684217.744, "dur": 5.201, "args": { "External id": 16432,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 9927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684220.117, "dur": 2.527, "args": { "External id": 16433,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 9928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650684223.788, "dur": 50.102, "args": { "External id": 16434,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650684248.065, "dur": 2.440, "args": { "External id": 16435,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650684252.661, "dur": 20.924, "args": { "External id": 16436,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 9931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650684255.354, "dur": 3.382, "args": { "External id": 16437,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650684275.367, "dur": 21.318, "args": { "External id": 16438,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650684298.038, "dur": 17.396, "args": { "External id": 16439,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650684318.149, "dur": 15.393, "args": { "External id": 16440,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 9935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650684334.624, "dur": 14.019, "args": { "External id": 16441,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 9936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650684350.174, "dur": 26.509, "args": { "External id": 16442,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 9937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650684352.031, "dur": 1.892, "args": { "External id": 16443,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 9938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684358.170, "dur": 1.073, "args": { "External id": 16444,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 9939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650684378.072, "dur": 12.932, "args": { "External id": 16445,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 9940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650684391.951, "dur": 11.809, "args": { "External id": 16446,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 9941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650684411.749, "dur": 2.041, "args": { "External id": 16447,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 9942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684421.672, "dur": 3.416, "args": { "External id": 16448,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 9943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684423.806, "dur": 0.569, "args": { "External id": 16449,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650684487.697, "dur": 53.449, "args": { "External id": 16450,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 9945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684545.917, "dur": 6.935, "args": { "External id": 16451,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 9946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684550.824, "dur": 0.960, "args": { "External id": 16452,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 9947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650684553.958, "dur": 25.998, "args": { "External id": 16453,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 9948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650684584.254, "dur": 5.189, "args": { "External id": 16454,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 9949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650684585.572, "dur": 3.248, "args": { "External id": 16455,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 9950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684587.563, "dur": 1.083, "args": { "External id": 16456,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 9951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650684592.036, "dur": 43.825, "args": { "External id": 16457,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650684595.321, "dur": 39.949, "args": { "External id": 16458,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 9953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650684639.180, "dur": 16.640, "args": { "External id": 16459,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650684660.772, "dur": 27.654, "args": { "External id": 16460,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 9955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650684663.078, "dur": 24.911, "args": { "External id": 16461,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 9956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684668.621, "dur": 2.794, "args": { "External id": 16462,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 9957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650684693.997, "dur": 29.607, "args": { "External id": 16463,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 9958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650684695.816, "dur": 27.586, "args": { "External id": 16464,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 9959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684700.337, "dur": 4.725, "args": { "External id": 16465,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650684708.433, "dur": 14.514, "args": { "External id": 16466,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 9961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650684735.298, "dur": 5.057, "args": { "External id": 16467,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9962 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650684737.088, "dur": 2.980, "args": { "External id": 16468,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650684741.789, "dur": 1.410, "args": { "External id": 16469,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9964 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650684742.680, "dur": 0.441, "args": { "External id": 16470,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 9965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650684783.086, "dur": 22.785, "args": { "External id": 16471,"Sequence number": 246760, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650684807.589, "dur": 16.016, "args": { "External id": 16472,"Sequence number": 246761, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 9967 } }, { "ph": "s", "id": 9, "pid": 1336754, "tid": 1336754, "ts": 1295650684807.589, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684830.577, "dur": 5.894, "args": { "External id": 16473,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], [], []], "Input Dims": [[16, 4, 4096], [], [], [], []], "Ev Idx": 9968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684834.097, "dur": 1.229, "args": { "External id": 16474,"Record function id": 0, "Concrete Inputs": ["", "[16, 4, 4096]", "[8192, 1, 1]", "1"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650684844.717, "dur": 6.851, "args": { "External id": 16475,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "3"], "Input type": ["long int", "Scalar", "Scalar"], "Input Strides": [[8192, 1, 1], [], []], "Input Dims": [[16, 4, 4096], [], []], "Ev Idx": 9970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684849.088, "dur": 1.198, "args": { "External id": 16476,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1, 1], [], [], []], "Input Dims": [[16, 4, 4096], [], [], []], "Ev Idx": 9971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684852.768, "dur": 3.032, "args": { "External id": 16477,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], []], "Ev Idx": 9972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684854.280, "dur": 0.982, "args": { "External id": 16478,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096]", "[8192, 1]", "4"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[8192, 1], [], [], []], "Input Dims": [[16, 4096], [], [], []], "Ev Idx": 9973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684862.012, "dur": 5.650, "args": { "External id": 16479,"Sequence number": 246762, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9974 } }, { "ph": "s", "id": 8, "pid": 1336754, "tid": 1336754, "ts": 1295650684862.012, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684865.211, "dur": 1.103, "args": { "External id": 16480,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684868.743, "dur": 5.599, "args": { "External id": 16481,"Sequence number": 246763, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "1", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], [], []], "Ev Idx": 9976 } }, { "ph": "s", "id": 7, "pid": 1336754, "tid": 1336754, "ts": 1295650684868.743, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684872.541, "dur": 1.039, "args": { "External id": 16482,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 4, 2048]", "[33554432, 8192, 2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::select", "pid": 1336754, "tid": 1336754, "ts": 1295650684875.383, "dur": 7.513, "args": { "External id": 16483,"Sequence number": 246764, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "3"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], []], "Input Dims": [[16, 4096, 4, 2048], [], []], "Ev Idx": 9978 } }, { "ph": "s", "id": 6, "pid": 1336754, "tid": 1336754, "ts": 1295650684875.383, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684881.229, "dur": 0.848, "args": { "External id": 16484,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 2048, 1], [], [], []], "Input Dims": [[16, 4096, 4, 2048], [], [], []], "Ev Idx": 9979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650684883.959, "dur": 7.115, "args": { "External id": 16485,"Sequence number": 246765, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "2", "0", "9223372036854775807", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], [], []], "Ev Idx": 9980 } }, { "ph": "s", "id": 5, "pid": 1336754, "tid": 1336754, "ts": 1295650684883.959, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650684887.574, "dur": 2.689, "args": { "External id": 16486,"Record function id": 0, "Concrete Inputs": ["", "[16, 4096, 2048]", "[33554432, 8192, 1]", "6144"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[33554432, 8192, 1], [], [], []], "Input Dims": [[16, 4096, 2048], [], [], []], "Ev Idx": 9981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650684894.991, "dur": 30.960, "args": { "External id": 16487,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650684896.740, "dur": 29.009, "args": { "External id": 16488,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["long int", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650684899.486, "dur": 6.423, "args": { "External id": 16489,"Record function id": 0, "Concrete Inputs": ["", "4", "0", "", "", "0"], "Input type": ["long int", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[16, 4096], [], [], [], [], []], "Ev Idx": 9984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650684902.191, "dur": 3.121, "args": { "External id": 16490,"Record function id": 0, "Concrete Inputs": ["[16, 4096]", "4", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650684906.774, "dur": 18.570, "args": { "External id": 16491,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "long int", "Scalar"], "Input Strides": [[4096, 1], [8192, 1], []], "Input Dims": [[16, 4096], [16, 4096], []], "Ev Idx": 9986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650684951.541, "dur": 5.555, "args": { "External id": 16492,"Sequence number": 246766, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1, 2048]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[33554432, 8192, 1], []], "Input Dims": [[16, 4096, 2048], []], "Ev Idx": 9987 } }, { "ph": "s", "id": 4, "pid": 1336754, "tid": 1336754, "ts": 1295650684951.541, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650684959.552, "dur": 1.328, "args": { "External id": 16493,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["long int", "ScalarList"], "Input Strides": [[4096, 1], []], "Input Dims": [[16, 4096], []], "Ev Idx": 9988 } }, { "ph": "X", "cat": "cpu_op", "name": "FusedLinearCrossEntropyFunction", "pid": 1336754, "tid": 1336754, "ts": 1295650685032.484, "dur": 44173.111, "args": { "External id": 16494,"Sequence number": 246767, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "", "", "-100", "0.", "1.", "8"], "Input type": ["c10::BFloat16", "long int", "c10::BFloat16", "", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[8192, 1], [1], [2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [65536], [32000, 2048], [], [], [], [], []], "Ev Idx": 9989 } }, { "ph": "s", "id": 3, "pid": 1336754, "tid": 1336754, "ts": 1295650685032.484, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::contiguous", "pid": 1336754, "tid": 1336754, "ts": 1295650685049.745, "dur": 33.768, "args": { "External id": 16495,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295650685050.788, "dur": 32.507, "args": { "External id": 16496,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[8192, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650685052.724, "dur": 9.067, "args": { "External id": 16497,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "", "0"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[8192, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650685054.439, "dur": 6.556, "args": { "External id": 16498,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "15", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650685062.918, "dur": 19.932, "args": { "External id": 16499,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [8192, 1], []], "Input Dims": [[65536, 2048], [65536, 2048], []], "Ev Idx": 9994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650685099.978, "dur": 27.266, "args": { "External id": 16500,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", ""], "Input type": ["c10::BFloat16", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650685101.201, "dur": 8.009, "args": { "External id": 16501,"Record function id": 0, "Concrete Inputs": ["", "15", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], [], []], "Ev Idx": 9996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650685104.913, "dur": 4.030, "args": { "External id": 16502,"Record function id": 0, "Concrete Inputs": ["[65536, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 9997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650685110.559, "dur": 16.452, "args": { "External id": 16503,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 9998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650685112.574, "dur": 13.932, "args": { "External id": 16504,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[65536, 2048], []], "Ev Idx": 9999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros_like", "pid": 1336754, "tid": 1336754, "ts": 1295650685130.683, "dur": 19.538, "args": { "External id": 16505,"Record function id": 0, "Concrete Inputs": ["", "6", "", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650685131.776, "dur": 4.445, "args": { "External id": 16506,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "False", ""], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650685133.307, "dur": 2.647, "args": { "External id": 16507,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650685136.863, "dur": 13.144, "args": { "External id": 16508,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650685137.466, "dur": 12.257, "args": { "External id": 16509,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[2048, 1], []], "Input Dims": [[32000, 2048], []], "Ev Idx": 10004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295650685156.276, "dur": 18.938, "args": { "External id": 16510,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False"], "Input type": ["ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650685159.970, "dur": 3.049, "args": { "External id": 16511,"Record function id": 0, "Concrete Inputs": ["[65536]", "6", "", "", "False", ""], "Input type": ["ScalarList", "Scalar", "", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295650685163.610, "dur": 11.322, "args": { "External id": 16512,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[65536]], "Ev Idx": 10007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650685164.419, "dur": 10.245, "args": { "External id": 16513,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1336754, "ts": 1295650685179.685, "dur": 23.229, "args": { "External id": 16514,"Record function id": 0, "Concrete Inputs": ["", "-100"], "Input type": ["long int", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650685205.736, "dur": 73.508, "args": { "External id": 16515,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["bool", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650685207.862, "dur": 70.901, "args": { "External id": 16516,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["bool", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650685215.410, "dur": 1.011, "args": { "External id": 16517,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["long int", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650685217.862, "dur": 42.223, "args": { "External id": 16518,"Record function id": 0, "Concrete Inputs": ["", "4", "False", "False", ""], "Input type": ["bool", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650685219.646, "dur": 39.995, "args": { "External id": 16519,"Record function id": 0, "Concrete Inputs": ["", "4", "", "", "", "False", ""], "Input type": ["bool", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[1], [], [], [], [], [], []], "Input Dims": [[65536], [], [], [], [], [], []], "Ev Idx": 10014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650685222.362, "dur": 2.994, "args": { "External id": 16520,"Record function id": 0, "Concrete Inputs": ["[65536]", "[1]", "4", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650685226.231, "dur": 32.806, "args": { "External id": 16521,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["long int", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[65536], [65536], []], "Ev Idx": 10016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295650685286.355, "dur": 38124.551, "args": { "External id": 16522,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295650685287.877, "dur": 38120.451, "args": { "External id": 16523,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["long int"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 10018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650723426.529, "dur": 8.603, "args": { "External id": 16524,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723431.721, "dur": 1.191, "args": { "External id": 16525,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650723440.613, "dur": 104.316, "args": { "External id": 16526,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650723442.367, "dur": 8.420, "args": { "External id": 16527,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650723444.827, "dur": 5.102, "args": { "External id": 16528,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723448.688, "dur": 0.979, "args": { "External id": 16529,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650723452.113, "dur": 92.255, "args": { "External id": 16530,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650723454.033, "dur": 89.594, "args": { "External id": 16531,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650723548.633, "dur": 4.418, "args": { "External id": 16532,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723550.944, "dur": 0.656, "args": { "External id": 16533,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650723560.389, "dur": 2.708, "args": { "External id": 16534,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650723574.865, "dur": 7.310, "args": { "External id": 16535,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650723577.240, "dur": 4.639, "args": { "External id": 16536,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650723713.917, "dur": 213.362, "args": { "External id": 16537,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650723719.138, "dur": 2.509, "args": { "External id": 16538,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650723723.411, "dur": 203.321, "args": { "External id": 16539,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650723725.211, "dur": 0.607, "args": { "External id": 16540,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650723727.118, "dur": 26.876, "args": { "External id": 16541,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650723758.168, "dur": 6.245, "args": { "External id": 16542,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723762.974, "dur": 1.097, "args": { "External id": 16543,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650723765.430, "dur": 24.899, "args": { "External id": 16544,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650723767.003, "dur": 1.899, "args": { "External id": 16545,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650723770.256, "dur": 19.824, "args": { "External id": 16546,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650723773.941, "dur": 3.120, "args": { "External id": 16547,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650723792.094, "dur": 23.873, "args": { "External id": 16548,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650723817.754, "dur": 18.425, "args": { "External id": 16549,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650723839.247, "dur": 16.284, "args": { "External id": 16550,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650723856.975, "dur": 14.263, "args": { "External id": 16551,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650723875.517, "dur": 21.731, "args": { "External id": 16552,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650723877.504, "dur": 1.913, "args": { "External id": 16553,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723881.756, "dur": 0.753, "args": { "External id": 16554,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650723898.609, "dur": 13.703, "args": { "External id": 16555,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650723913.494, "dur": 12.395, "args": { "External id": 16556,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650723933.701, "dur": 2.023, "args": { "External id": 16557,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650723944.319, "dur": 4.085, "args": { "External id": 16558,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650723946.692, "dur": 0.761, "args": { "External id": 16559,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "0"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724060.732, "dur": 68.613, "args": { "External id": 16560,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724135.823, "dur": 6.586, "args": { "External id": 16561,"Record function id": 0, "Concrete Inputs": ["", "0", "0", "8192", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724138.799, "dur": 1.096, "args": { "External id": 16562,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "0"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650724144.140, "dur": 29.706, "args": { "External id": 16563,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650724179.726, "dur": 8.422, "args": { "External id": 16564,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650724181.794, "dur": 5.670, "args": { "External id": 16565,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724185.756, "dur": 1.449, "args": { "External id": 16566,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650724191.203, "dur": 57.405, "args": { "External id": 16567,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724192.586, "dur": 54.963, "args": { "External id": 16568,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650724254.531, "dur": 19.299, "args": { "External id": 16569,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724281.087, "dur": 4.603, "args": { "External id": 16570,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724283.459, "dur": 0.955, "args": { "External id": 16571,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650724292.544, "dur": 53.676, "args": { "External id": 16572,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650724293.849, "dur": 4.719, "args": { "External id": 16573,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650724295.054, "dur": 2.941, "args": { "External id": 16574,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724296.855, "dur": 0.789, "args": { "External id": 16575,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650724299.194, "dur": 46.616, "args": { "External id": 16576,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724300.161, "dur": 45.049, "args": { "External id": 16577,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724352.345, "dur": 4.043, "args": { "External id": 16578,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724354.368, "dur": 0.688, "args": { "External id": 16579,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650724362.968, "dur": 1.694, "args": { "External id": 16580,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650724372.547, "dur": 9.897, "args": { "External id": 16581,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650724374.837, "dur": 7.281, "args": { "External id": 16582,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650724483.284, "dur": 196.255, "args": { "External id": 16583,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650724485.947, "dur": 2.521, "args": { "External id": 16584,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650724489.922, "dur": 189.110, "args": { "External id": 16585,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650724491.575, "dur": 0.277, "args": { "External id": 16586,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650724493.155, "dur": 25.412, "args": { "External id": 16587,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650724520.193, "dur": 3.270, "args": { "External id": 16588,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724522.320, "dur": 0.926, "args": { "External id": 16589,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650724524.438, "dur": 28.626, "args": { "External id": 16590,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650724525.979, "dur": 1.662, "args": { "External id": 16591,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650724528.792, "dur": 23.939, "args": { "External id": 16592,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650724536.811, "dur": 2.978, "args": { "External id": 16593,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650724554.609, "dur": 22.394, "args": { "External id": 16594,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650724578.796, "dur": 14.536, "args": { "External id": 16595,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650724596.545, "dur": 15.050, "args": { "External id": 16596,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650724613.121, "dur": 14.049, "args": { "External id": 16597,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650724628.856, "dur": 20.871, "args": { "External id": 16598,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650724631.181, "dur": 1.932, "args": { "External id": 16599,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724635.110, "dur": 0.791, "args": { "External id": 16600,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650724653.259, "dur": 13.129, "args": { "External id": 16601,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650724667.517, "dur": 10.557, "args": { "External id": 16602,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650724686.338, "dur": 1.730, "args": { "External id": 16603,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724697.015, "dur": 3.654, "args": { "External id": 16604,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724699.498, "dur": 0.428, "args": { "External id": 16605,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "8192"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724769.370, "dur": 55.632, "args": { "External id": 16606,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724829.918, "dur": 5.143, "args": { "External id": 16607,"Record function id": 0, "Concrete Inputs": ["", "0", "8192", "16384", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724832.534, "dur": 1.502, "args": { "External id": 16608,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "16777216"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650724838.295, "dur": 23.991, "args": { "External id": 16609,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650724866.825, "dur": 5.093, "args": { "External id": 16610,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650724868.201, "dur": 3.172, "args": { "External id": 16611,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724870.112, "dur": 1.055, "args": { "External id": 16612,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650724874.749, "dur": 42.088, "args": { "External id": 16613,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724875.893, "dur": 40.472, "args": { "External id": 16614,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650724920.800, "dur": 15.519, "args": { "External id": 16615,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650724944.277, "dur": 4.091, "args": { "External id": 16616,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724946.465, "dur": 0.888, "args": { "External id": 16617,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650724952.179, "dur": 91.737, "args": { "External id": 16618,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650724953.040, "dur": 5.465, "args": { "External id": 16619,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650724953.748, "dur": 4.180, "args": { "External id": 16620,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650724955.021, "dur": 2.707, "args": { "External id": 16621,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650724961.336, "dur": 81.932, "args": { "External id": 16622,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650724962.472, "dur": 79.637, "args": { "External id": 16623,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650725050.376, "dur": 5.102, "args": { "External id": 16624,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725052.850, "dur": 1.052, "args": { "External id": 16625,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650725061.931, "dur": 1.692, "args": { "External id": 16626,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725071.716, "dur": 6.225, "args": { "External id": 16627,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725073.684, "dur": 4.011, "args": { "External id": 16628,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650725175.787, "dur": 219.150, "args": { "External id": 16629,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725178.177, "dur": 2.621, "args": { "External id": 16630,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650725182.795, "dur": 211.658, "args": { "External id": 16631,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650725184.575, "dur": 0.636, "args": { "External id": 16632,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650725188.592, "dur": 24.806, "args": { "External id": 16633,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650725215.088, "dur": 2.974, "args": { "External id": 16634,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725217.151, "dur": 0.656, "args": { "External id": 16635,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650725219.008, "dur": 44.596, "args": { "External id": 16636,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725220.384, "dur": 3.344, "args": { "External id": 16637,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650725225.000, "dur": 38.330, "args": { "External id": 16638,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650725245.403, "dur": 3.648, "args": { "External id": 16639,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650725265.176, "dur": 24.399, "args": { "External id": 16640,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650725291.236, "dur": 13.661, "args": { "External id": 16641,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650725307.596, "dur": 15.605, "args": { "External id": 16642,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650725324.515, "dur": 14.352, "args": { "External id": 16643,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650725340.867, "dur": 22.350, "args": { "External id": 16644,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650725343.075, "dur": 1.985, "args": { "External id": 16645,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725347.324, "dur": 0.669, "args": { "External id": 16646,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650725367.069, "dur": 13.291, "args": { "External id": 16647,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650725381.551, "dur": 11.948, "args": { "External id": 16648,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650725402.242, "dur": 2.176, "args": { "External id": 16649,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650725412.789, "dur": 3.473, "args": { "External id": 16650,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725415.092, "dur": 0.487, "args": { "External id": 16651,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "16384"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650725486.652, "dur": 82.428, "args": { "External id": 16652,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650725574.020, "dur": 7.302, "args": { "External id": 16653,"Record function id": 0, "Concrete Inputs": ["", "0", "16384", "24576", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725579.099, "dur": 1.198, "args": { "External id": 16654,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "33554432"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650725582.878, "dur": 31.915, "args": { "External id": 16655,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650725619.536, "dur": 7.964, "args": { "External id": 16656,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650725621.110, "dur": 5.779, "args": { "External id": 16657,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725623.371, "dur": 3.285, "args": { "External id": 16658,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650725630.283, "dur": 51.881, "args": { "External id": 16659,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650725631.325, "dur": 50.352, "args": { "External id": 16660,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650725687.964, "dur": 16.088, "args": { "External id": 16661,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650725709.704, "dur": 3.763, "args": { "External id": 16662,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725711.699, "dur": 0.894, "args": { "External id": 16663,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650725717.305, "dur": 50.214, "args": { "External id": 16664,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650725718.354, "dur": 5.634, "args": { "External id": 16665,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650725719.277, "dur": 4.162, "args": { "External id": 16666,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725722.709, "dur": 0.589, "args": { "External id": 16667,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650725724.566, "dur": 42.563, "args": { "External id": 16668,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650725725.551, "dur": 41.135, "args": { "External id": 16669,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650725771.399, "dur": 19.216, "args": { "External id": 16670,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725788.584, "dur": 0.886, "args": { "External id": 16671,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650725795.721, "dur": 1.652, "args": { "External id": 16672,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725807.065, "dur": 8.742, "args": { "External id": 16673,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725809.047, "dur": 6.466, "args": { "External id": 16674,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650725899.352, "dur": 228.562, "args": { "External id": 16675,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725901.416, "dur": 2.428, "args": { "External id": 16676,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650725905.716, "dur": 221.786, "args": { "External id": 16677,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650725907.412, "dur": 0.402, "args": { "External id": 16678,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650725908.956, "dur": 24.080, "args": { "External id": 16679,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650725936.966, "dur": 3.589, "args": { "External id": 16680,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650725939.046, "dur": 1.147, "args": { "External id": 16681,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650725941.463, "dur": 24.370, "args": { "External id": 16682,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650725942.838, "dur": 1.569, "args": { "External id": 16683,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650725945.587, "dur": 19.849, "args": { "External id": 16684,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650725950.165, "dur": 2.391, "args": { "External id": 16685,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650725967.194, "dur": 55.417, "args": { "External id": 16686,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650726025.469, "dur": 16.003, "args": { "External id": 16687,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650726044.613, "dur": 14.820, "args": { "External id": 16688,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650726061.135, "dur": 12.800, "args": { "External id": 16689,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650726078.312, "dur": 20.966, "args": { "External id": 16690,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650726080.478, "dur": 2.033, "args": { "External id": 16691,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726084.173, "dur": 0.645, "args": { "External id": 16692,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650726100.643, "dur": 13.040, "args": { "External id": 16693,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650726114.985, "dur": 11.373, "args": { "External id": 16694,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650726135.453, "dur": 2.202, "args": { "External id": 16695,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726147.095, "dur": 3.733, "args": { "External id": 16696,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726149.361, "dur": 0.591, "args": { "External id": 16697,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "24576"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650726220.654, "dur": 74.730, "args": { "External id": 16698,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726301.834, "dur": 5.835, "args": { "External id": 16699,"Record function id": 0, "Concrete Inputs": ["", "0", "24576", "32768", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726304.894, "dur": 1.306, "args": { "External id": 16700,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "50331648"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650726308.912, "dur": 26.009, "args": { "External id": 16701,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650726339.626, "dur": 6.887, "args": { "External id": 16702,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650726341.237, "dur": 4.510, "args": { "External id": 16703,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726344.593, "dur": 0.886, "args": { "External id": 16704,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650726349.752, "dur": 40.778, "args": { "External id": 16705,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650726350.749, "dur": 39.231, "args": { "External id": 16706,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650726394.299, "dur": 16.222, "args": { "External id": 16707,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726416.187, "dur": 3.632, "args": { "External id": 16708,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726418.326, "dur": 0.773, "args": { "External id": 16709,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650726423.661, "dur": 52.244, "args": { "External id": 16710,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650726426.681, "dur": 5.958, "args": { "External id": 16711,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650726427.561, "dur": 4.514, "args": { "External id": 16712,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726428.793, "dur": 3.123, "args": { "External id": 16713,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650726433.296, "dur": 42.173, "args": { "External id": 16714,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650726434.390, "dur": 40.286, "args": { "External id": 16715,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726479.676, "dur": 4.136, "args": { "External id": 16716,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726481.849, "dur": 0.909, "args": { "External id": 16717,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650726489.726, "dur": 1.585, "args": { "External id": 16718,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650726501.253, "dur": 6.218, "args": { "External id": 16719,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650726503.305, "dur": 3.909, "args": { "External id": 16720,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650726588.650, "dur": 198.392, "args": { "External id": 16721,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650726591.351, "dur": 2.952, "args": { "External id": 16722,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650726595.892, "dur": 190.686, "args": { "External id": 16723,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650726596.967, "dur": 0.499, "args": { "External id": 16724,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650726603.442, "dur": 21.026, "args": { "External id": 16725,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650726632.404, "dur": 3.184, "args": { "External id": 16726,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726634.533, "dur": 0.840, "args": { "External id": 16727,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650726636.598, "dur": 23.910, "args": { "External id": 16728,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650726637.920, "dur": 4.096, "args": { "External id": 16729,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650726643.205, "dur": 17.009, "args": { "External id": 16730,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650726645.766, "dur": 2.623, "args": { "External id": 16731,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650726662.092, "dur": 22.067, "args": { "External id": 16732,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650726685.864, "dur": 13.904, "args": { "External id": 16733,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650726702.440, "dur": 15.253, "args": { "External id": 16734,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650726721.301, "dur": 12.692, "args": { "External id": 16735,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650726735.432, "dur": 21.055, "args": { "External id": 16736,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650726737.412, "dur": 1.871, "args": { "External id": 16737,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726741.001, "dur": 0.971, "args": { "External id": 16738,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650726757.809, "dur": 13.204, "args": { "External id": 16739,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650726772.077, "dur": 11.263, "args": { "External id": 16740,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650726792.631, "dur": 1.592, "args": { "External id": 16741,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726802.529, "dur": 3.590, "args": { "External id": 16742,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726804.704, "dur": 0.574, "args": { "External id": 16743,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "32768"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650726864.462, "dur": 47.242, "args": { "External id": 16744,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650726916.328, "dur": 4.679, "args": { "External id": 16745,"Record function id": 0, "Concrete Inputs": ["", "0", "32768", "40960", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726918.807, "dur": 1.208, "args": { "External id": 16746,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "67108864"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650726922.219, "dur": 22.443, "args": { "External id": 16747,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650726948.748, "dur": 9.287, "args": { "External id": 16748,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650726952.220, "dur": 5.206, "args": { "External id": 16749,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650726954.246, "dur": 2.976, "args": { "External id": 16750,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650726959.866, "dur": 78.145, "args": { "External id": 16751,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650726960.778, "dur": 75.995, "args": { "External id": 16752,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650727043.685, "dur": 17.316, "args": { "External id": 16753,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727067.896, "dur": 6.732, "args": { "External id": 16754,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727072.738, "dur": 0.773, "args": { "External id": 16755,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650727078.478, "dur": 53.212, "args": { "External id": 16756,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650727079.555, "dur": 4.750, "args": { "External id": 16757,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650727080.809, "dur": 2.994, "args": { "External id": 16758,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727082.285, "dur": 1.078, "args": { "External id": 16759,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650727085.128, "dur": 46.192, "args": { "External id": 16760,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650727086.158, "dur": 44.627, "args": { "External id": 16761,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727137.487, "dur": 3.745, "args": { "External id": 16762,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727139.484, "dur": 0.608, "args": { "External id": 16763,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650727146.851, "dur": 1.245, "args": { "External id": 16764,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727155.275, "dur": 6.908, "args": { "External id": 16765,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727157.319, "dur": 4.612, "args": { "External id": 16766,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650727267.302, "dur": 191.373, "args": { "External id": 16767,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727269.765, "dur": 3.179, "args": { "External id": 16768,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650727277.017, "dur": 181.330, "args": { "External id": 16769,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650727278.395, "dur": 0.471, "args": { "External id": 16770,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650727279.947, "dur": 24.094, "args": { "External id": 16771,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650727305.562, "dur": 5.054, "args": { "External id": 16772,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727307.194, "dur": 3.099, "args": { "External id": 16773,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650727311.699, "dur": 25.222, "args": { "External id": 16774,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727312.987, "dur": 2.008, "args": { "External id": 16775,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650727318.111, "dur": 18.533, "args": { "External id": 16776,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650727320.910, "dur": 2.833, "args": { "External id": 16777,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650727338.194, "dur": 20.642, "args": { "External id": 16778,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650727360.194, "dur": 14.720, "args": { "External id": 16779,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650727377.931, "dur": 13.661, "args": { "External id": 16780,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650727392.891, "dur": 13.623, "args": { "External id": 16781,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650727408.022, "dur": 23.373, "args": { "External id": 16782,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650727410.281, "dur": 1.790, "args": { "External id": 16783,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727416.254, "dur": 1.221, "args": { "External id": 16784,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650727432.953, "dur": 12.692, "args": { "External id": 16785,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650727446.784, "dur": 10.543, "args": { "External id": 16786,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650727465.207, "dur": 1.776, "args": { "External id": 16787,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727475.553, "dur": 3.660, "args": { "External id": 16788,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727477.893, "dur": 0.485, "args": { "External id": 16789,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "40960"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650727545.224, "dur": 54.170, "args": { "External id": 16790,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727604.250, "dur": 9.161, "args": { "External id": 16791,"Record function id": 0, "Concrete Inputs": ["", "0", "40960", "49152", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727609.237, "dur": 3.083, "args": { "External id": 16792,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "83886080"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650727614.854, "dur": 25.687, "args": { "External id": 16793,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650727645.203, "dur": 5.903, "args": { "External id": 16794,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650727647.129, "dur": 3.363, "args": { "External id": 16795,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727649.234, "dur": 1.068, "args": { "External id": 16796,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650727653.256, "dur": 40.411, "args": { "External id": 16797,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650727654.598, "dur": 38.502, "args": { "External id": 16798,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650727699.793, "dur": 15.038, "args": { "External id": 16799,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727720.325, "dur": 3.627, "args": { "External id": 16800,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10295 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727722.232, "dur": 0.770, "args": { "External id": 16801,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650727727.444, "dur": 48.152, "args": { "External id": 16802,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650727728.526, "dur": 6.559, "args": { "External id": 16803,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650727729.345, "dur": 5.071, "args": { "External id": 16804,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10299 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727733.471, "dur": 0.622, "args": { "External id": 16805,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650727735.669, "dur": 39.566, "args": { "External id": 16806,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650727736.296, "dur": 38.466, "args": { "External id": 16807,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650727778.958, "dur": 4.317, "args": { "External id": 16808,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727781.204, "dur": 0.971, "args": { "External id": 16809,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10304 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650727788.384, "dur": 1.712, "args": { "External id": 16810,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10305 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727797.360, "dur": 8.107, "args": { "External id": 16811,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10306 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727801.687, "dur": 3.537, "args": { "External id": 16812,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650727886.102, "dur": 231.704, "args": { "External id": 16813,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10308 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727888.163, "dur": 4.153, "args": { "External id": 16814,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10309 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650727893.963, "dur": 223.366, "args": { "External id": 16815,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10310 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650727895.283, "dur": 0.194, "args": { "External id": 16816,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650727896.546, "dur": 20.445, "args": { "External id": 16817,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650727918.327, "dur": 6.242, "args": { "External id": 16818,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10313 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650727922.907, "dur": 1.454, "args": { "External id": 16819,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650727925.563, "dur": 23.670, "args": { "External id": 16820,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650727926.681, "dur": 1.657, "args": { "External id": 16821,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650727931.552, "dur": 17.416, "args": { "External id": 16822,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650727934.233, "dur": 2.792, "args": { "External id": 16823,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650727950.473, "dur": 19.454, "args": { "External id": 16824,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650727971.488, "dur": 51.348, "args": { "External id": 16825,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650728027.023, "dur": 18.511, "args": { "External id": 16826,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650728046.893, "dur": 13.656, "args": { "External id": 16827,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650728062.226, "dur": 27.212, "args": { "External id": 16828,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650728066.998, "dur": 2.110, "args": { "External id": 16829,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728072.643, "dur": 1.068, "args": { "External id": 16830,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650728090.722, "dur": 13.097, "args": { "External id": 16831,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650728104.880, "dur": 11.346, "args": { "External id": 16832,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650728125.490, "dur": 2.596, "args": { "External id": 16833,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728138.602, "dur": 3.860, "args": { "External id": 16834,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728141.200, "dur": 0.368, "args": { "External id": 16835,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "49152"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650728208.715, "dur": 71.422, "args": { "External id": 16836,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728286.851, "dur": 7.761, "args": { "External id": 16837,"Record function id": 0, "Concrete Inputs": ["", "0", "49152", "57344", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728292.189, "dur": 0.965, "args": { "External id": 16838,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "100663296"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650728296.054, "dur": 25.106, "args": { "External id": 16839,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650728326.408, "dur": 5.799, "args": { "External id": 16840,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650728327.962, "dur": 3.705, "args": { "External id": 16841,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728329.834, "dur": 1.622, "args": { "External id": 16842,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650728335.104, "dur": 44.871, "args": { "External id": 16843,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10338 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650728338.547, "dur": 40.653, "args": { "External id": 16844,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10339 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650728383.908, "dur": 16.747, "args": { "External id": 16845,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728406.558, "dur": 3.607, "args": { "External id": 16846,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728408.647, "dur": 0.732, "args": { "External id": 16847,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linear", "pid": 1336754, "tid": 1336754, "ts": 1295650728413.753, "dur": 49.042, "args": { "External id": 16848,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["c10::BFloat16", "c10::BFloat16", ""], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [32000, 2048], []], "Ev Idx": 10343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650728414.582, "dur": 5.784, "args": { "External id": 16849,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650728415.465, "dur": 4.394, "args": { "External id": 16850,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], []], "Input Dims": [[32000, 2048], [], []], "Ev Idx": 10345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728419.088, "dur": 0.635, "args": { "External id": 16851,"Record function id": 0, "Concrete Inputs": ["", "[2048, 32000]", "[1, 2048]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[32000, 2048], [], [], []], "Ev Idx": 10346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650728421.178, "dur": 41.141, "args": { "External id": 16852,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650728421.836, "dur": 39.723, "args": { "External id": 16853,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[2048, 1], [1, 2048]], "Input Dims": [[8192, 2048], [2048, 32000]], "Ev Idx": 10348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728466.632, "dur": 3.774, "args": { "External id": 16854,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["long int", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728468.733, "dur": 0.648, "args": { "External id": 16855,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["long int", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650728476.123, "dur": 1.753, "args": { "External id": 16856,"Record function id": 0, "Concrete Inputs": ["", "[-1, 32000]"], "Input type": ["c10::BFloat16", "ScalarList"], "Input Strides": [[32000, 1], []], "Input Dims": [[8192, 32000], []], "Ev Idx": 10351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::new_empty", "pid": 1336754, "tid": 1336754, "ts": 1295650728487.136, "dur": 6.075, "args": { "External id": 16857,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "6", "", "", "False"], "Input type": ["c10::BFloat16", "ScalarList", "Scalar", "", "", "Scalar"], "Input Strides": [[32000, 1], [], [], [], [], []], "Input Dims": [[8192, 32000], [], [], [], [], []], "Ev Idx": 10352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650728489.080, "dur": 3.865, "args": { "External id": 16858,"Record function id": 0, "Concrete Inputs": ["[8192, 1]", "6", "0", "", "False", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "Scalar", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650728573.653, "dur": 195.138, "args": { "External id": 16859,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650728577.945, "dur": 2.329, "args": { "External id": 16860,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::logsumexp", "pid": 1336754, "tid": 1336754, "ts": 1295650728582.234, "dur": 185.833, "args": { "External id": 16861,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", "float"], "Input Strides": [[1, 1], [], [], [1]], "Input Dims": [[8192, 1], [], [], [0]], "Ev Idx": 10356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::real", "pid": 1336754, "tid": 1336754, "ts": 1295650728583.502, "dur": 0.458, "args": { "External id": 16862,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::amax", "pid": 1336754, "tid": 1336754, "ts": 1295650728587.104, "dur": 21.590, "args": { "External id": 16863,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "True"], "Input type": ["float", "ScalarList", "Scalar"], "Input Strides": [[1, 1], [], []], "Input Dims": [[8192, 1], [], []], "Ev Idx": 10358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::squeeze", "pid": 1336754, "tid": 1336754, "ts": 1295650728610.297, "dur": 5.688, "args": { "External id": 16864,"Record function id": 0, "Concrete Inputs": ["", "[-1]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1, 1], []], "Input Dims": [[8192, 1], []], "Ev Idx": 10359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728614.620, "dur": 1.048, "args": { "External id": 16865,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1, 1], [], [], []], "Input Dims": [[8192, 1], [], [], []], "Ev Idx": 10360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650728616.860, "dur": 20.628, "args": { "External id": 16866,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295650728618.100, "dur": 1.541, "args": { "External id": 16867,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295650728620.921, "dur": 16.286, "args": { "External id": 16868,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[1], [1]], "Input Dims": [[8192], [0]], "Ev Idx": 10363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650728622.867, "dur": 2.727, "args": { "External id": 16869,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295650728638.710, "dur": 20.912, "args": { "External id": 16870,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::masked_fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650728660.934, "dur": 17.417, "args": { "External id": 16871,"Record function id": 0, "Concrete Inputs": ["", "", "0"], "Input type": ["float", "bool", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sub", "pid": 1336754, "tid": 1336754, "ts": 1295650728681.329, "dur": 14.661, "args": { "External id": 16872,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1, 1], [1, 1], []], "Input Dims": [[8192, 1], [8192, 1], []], "Ev Idx": 10367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::exp_", "pid": 1336754, "tid": 1336754, "ts": 1295650728699.301, "dur": 14.591, "args": { "External id": 16873,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1, 1]], "Input Dims": [[8192, 1]], "Ev Idx": 10368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650728715.576, "dur": 21.587, "args": { "External id": 16874,"Record function id": 0, "Concrete Inputs": ["", "[-1]", "False", "", ""], "Input type": ["float", "ScalarList", "Scalar", "", "float"], "Input Strides": [[1, 1], [], [], [], [1]], "Input Dims": [[8192, 1], [], [], [], [0]], "Ev Idx": 10369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295650728717.068, "dur": 1.750, "args": { "External id": 16875,"Record function id": 0, "Concrete Inputs": ["", "[8192]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 10370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728722.230, "dur": 0.905, "args": { "External id": 16876,"Record function id": 0, "Concrete Inputs": ["", "[8192, 1]", "[1, 0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[8192], [], [], []], "Ev Idx": 10371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::log_", "pid": 1336754, "tid": 1336754, "ts": 1295650728738.760, "dur": 13.816, "args": { "External id": 16877,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[8192]], "Ev Idx": 10372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650728753.794, "dur": 12.886, "args": { "External id": 16878,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [1], []], "Input Dims": [[8192], [8192], []], "Ev Idx": 10373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295650728776.836, "dur": 1.676, "args": { "External id": 16879,"Record function id": 0, "Concrete Inputs": ["", "[8192]"], "Input type": ["float", "ScalarList"], "Input Strides": [[1], []], "Input Dims": [[8192], []], "Ev Idx": 10374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728787.059, "dur": 3.733, "args": { "External id": 16880,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["float", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], []], "Input Dims": [[65536], [], [], [], []], "Ev Idx": 10375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728789.545, "dur": 0.476, "args": { "External id": 16881,"Record function id": 0, "Concrete Inputs": ["", "[8192]", "[1]", "57344"], "Input type": ["float", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650728852.145, "dur": 48.149, "args": { "External id": 16882,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[32000, 1], [2048, 1]], "Input Dims": [[8192, 32000], [32000, 2048]], "Ev Idx": 10377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::slice", "pid": 1336754, "tid": 1336754, "ts": 1295650728904.860, "dur": 4.195, "args": { "External id": 16883,"Record function id": 0, "Concrete Inputs": ["", "0", "57344", "65536", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar", "Scalar", "Scalar"], "Input Strides": [[2048, 1], [], [], [], []], "Input Dims": [[65536, 2048], [], [], [], []], "Ev Idx": 10378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728907.270, "dur": 0.794, "args": { "External id": 16884,"Record function id": 0, "Concrete Inputs": ["", "[8192, 2048]", "[2048, 1]", "117440512"], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", "Scalar"], "Input Strides": [[2048, 1], [], [], []], "Input Dims": [[65536, 2048], [], [], []], "Ev Idx": 10379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650728910.412, "dur": 21.772, "args": { "External id": 16885,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[8192, 2048], [8192, 2048], []], "Ev Idx": 10380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::t", "pid": 1336754, "tid": 1336754, "ts": 1295650728936.314, "dur": 7.193, "args": { "External id": 16886,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[32000, 1]], "Input Dims": [[8192, 32000]], "Ev Idx": 10381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::transpose", "pid": 1336754, "tid": 1336754, "ts": 1295650728937.596, "dur": 5.365, "args": { "External id": 16887,"Record function id": 0, "Concrete Inputs": ["", "0", "1"], "Input type": ["c10::BFloat16", "Scalar", "Scalar"], "Input Strides": [[32000, 1], [], []], "Input Dims": [[8192, 32000], [], []], "Ev Idx": 10382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650728941.245, "dur": 1.551, "args": { "External id": 16888,"Record function id": 0, "Concrete Inputs": ["", "[32000, 8192]", "[1, 32000]", ""], "Input type": ["c10::BFloat16", "ScalarList", "ScalarList", ""], "Input Strides": [[32000, 1], [], [], []], "Input Dims": [[8192, 32000], [], [], []], "Ev Idx": 10383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::matmul", "pid": 1336754, "tid": 1336754, "ts": 1295650728945.510, "dur": 74.938, "args": { "External id": 16889,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mm", "pid": 1336754, "tid": 1336754, "ts": 1295650728946.710, "dur": 37.117, "args": { "External id": 16890,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["c10::BFloat16", "c10::BFloat16"], "Input Strides": [[1, 32000], [2048, 1]], "Input Dims": [[32000, 8192], [8192, 2048]], "Ev Idx": 10385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650729027.000, "dur": 20.506, "args": { "External id": 16891,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "c10::BFloat16", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650729053.075, "dur": 28.399, "args": { "External id": 16892,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[1], []], "Input Dims": [[65536], []], "Ev Idx": 10387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::sum", "pid": 1336754, "tid": 1336754, "ts": 1295650729055.849, "dur": 25.230, "args": { "External id": 16893,"Record function id": 0, "Concrete Inputs": ["", "[]", "False", ""], "Input type": ["float", "ScalarList", "Scalar", ""], "Input Strides": [[1], [], [], []], "Input Dims": [[65536], [], [], []], "Ev Idx": 10388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650729061.769, "dur": 2.781, "args": { "External id": 16894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295650729087.528, "dur": 73.843, "args": { "External id": 16895,"Record function id": 0, "Concrete Inputs": ["", "", "15", "False", "False", ""], "Input type": ["float", "", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], []], "Ev Idx": 10390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_to_copy", "pid": 1336754, "tid": 1336754, "ts": 1295650729089.168, "dur": 71.997, "args": { "External id": 16896,"Record function id": 0, "Concrete Inputs": ["", "15", "", "", "", "False", ""], "Input type": ["float", "Scalar", "", "", "", "Scalar", ""], "Input Strides": [[2048, 1], [], [], [], [], [], []], "Input Dims": [[32000, 2048], [], [], [], [], [], []], "Ev Idx": 10391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650729138.484, "dur": 5.419, "args": { "External id": 16897,"Record function id": 0, "Concrete Inputs": ["[32000, 2048]", "[2048, 1]", "15", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295650729145.124, "dur": 15.586, "args": { "External id": 16898,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["c10::BFloat16", "float", "Scalar"], "Input Strides": [[2048, 1], [2048, 1], []], "Input Dims": [[32000, 2048], [32000, 2048], []], "Ev Idx": 10393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650729174.307, "dur": 4.847, "args": { "External id": 16899,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10394 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650729176.070, "dur": 2.820, "args": { "External id": 16900,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[65536, 2048]], "Ev Idx": 10395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::detach", "pid": 1336754, "tid": 1336754, "ts": 1295650729180.170, "dur": 0.852, "args": { "External id": 16901,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10396 } }, { "ph": "X", "cat": "cpu_op", "name": "detach", "pid": 1336754, "tid": 1336754, "ts": 1295650729180.448, "dur": 0.486, "args": { "External id": 16902,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["c10::BFloat16"], "Input Strides": [[2048, 1]], "Input Dims": [[32000, 2048]], "Ev Idx": 10397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650729223.447, "dur": 41.826, "args": { "External id": 16903,"Sequence number": 246768, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add_", "pid": 1336754, "tid": 1336754, "ts": 1295650729268.182, "dur": 15.483, "args": { "External id": 16904,"Sequence number": 246769, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10399 } }, { "ph": "s", "id": 2, "pid": 1336754, "tid": 1336754, "ts": 1295650729268.182, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "user_annotation", "name": "FSDP::post_forward", "pid": 1336754, "tid": 1336754, "ts": 1295650729389.448, "dur": 39.182, "args": { "External id": 16905,"Record function id": 0, "Ev Idx": 10400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336754, "tid": 1336754, "ts": 1295650729531.536, "dur": 35.769, "args": { "External id": 16906,"Sequence number": 246770, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10401 } }, { "ph": "s", "id": 1, "pid": 1336754, "tid": 1336754, "ts": 1295650729531.536, "cat": "fwdbwd", "name": "fwdbwd" }, { "ph": "X", "cat": "cpu_op", "name": "aten::ones_like", "pid": 1336754, "tid": 1336754, "ts": 1295650729624.611, "dur": 28.104, "args": { "External id": 16907,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295650729626.261, "dur": 8.234, "args": { "External id": 16908,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "False", "1"], "Input type": ["float", "", "", "", "Scalar", "Scalar"], "Input Strides": [[1], [], [], [], [], []], "Input Dims": [[1], [], [], [], [], []], "Ev Idx": 10403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_strided", "pid": 1336754, "tid": 1336754, "ts": 1295650729630.174, "dur": 3.763, "args": { "External id": 16909,"Record function id": 0, "Concrete Inputs": ["[1]", "[1]", "6", "0", "", "False"], "Input type": ["ScalarList", "ScalarList", "Scalar", "Scalar", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295650729636.437, "dur": 15.954, "args": { "External id": 16910,"Record function id": 0, "Concrete Inputs": ["", "1."], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336754, "tid": 1336754, "ts": 1295652033242.943, "dur": 51.503, "args": { "External id": 16911,"Sequence number": 246771, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::div", "pid": 1336754, "tid": 1336754, "ts": 1295652033302.925, "dur": 18.284, "args": { "External id": 16912,"Sequence number": 246772, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "long int"], "Input Strides": [[1], []], "Input Dims": [[1], []], "Ev Idx": 10407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295652033328.031, "dur": 24.009, "args": { "External id": 16913,"Sequence number": 246773, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295652033870.513, "dur": 22.109, "args": { "External id": 16914,"Sequence number": 246774, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295652034409.248, "dur": 35.560, "args": { "External id": 16915,"Sequence number": 246775, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "long int", "Scalar"], "Input Strides": [[1], [], []], "Input Dims": [[1], [], []], "Ev Idx": 10410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336754, "tid": 1336754, "ts": 1295652035957.453, "dur": 3291.327, "args": { "External id": 16916,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_norm", "pid": 1336754, "tid": 1336754, "ts": 1295652036579.925, "dur": 1110.342, "args": { "External id": 16917,"Record function id": 0, "Concrete Inputs": ["", "2.", ""], "Input type": ["TensorList", "Scalar", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 10412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zeros", "pid": 1336754, "tid": 1336754, "ts": 1295652036598.362, "dur": 61.761, "args": { "External id": 16918,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 10413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295652036601.581, "dur": 11.348, "args": { "External id": 16919,"Record function id": 0, "Concrete Inputs": ["[36375]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 10414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::zero_", "pid": 1336754, "tid": 1336754, "ts": 1295652036615.659, "dur": 44.168, "args": { "External id": 16920,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[1]], "Input Dims": [[36375]], "Ev Idx": 10415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::fill_", "pid": 1336754, "tid": 1336754, "ts": 1295652036617.632, "dur": 41.609, "args": { "External id": 16921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[1], []], "Input Dims": [[36375], []], "Ev Idx": 10416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039285.269, "dur": 2.859, "args": { "External id": 16922,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039290.294, "dur": 0.473, "args": { "External id": 16923,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039292.222, "dur": 0.390, "args": { "External id": 16924,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039293.827, "dur": 0.237, "args": { "External id": 16925,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039295.793, "dur": 0.174, "args": { "External id": 16926,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039297.531, "dur": 0.234, "args": { "External id": 16927,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039299.097, "dur": 0.204, "args": { "External id": 16928,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039302.853, "dur": 0.212, "args": { "External id": 16929,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039303.986, "dur": 0.446, "args": { "External id": 16930,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039305.380, "dur": 0.404, "args": { "External id": 16931,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039306.732, "dur": 0.228, "args": { "External id": 16932,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039307.658, "dur": 0.204, "args": { "External id": 16933,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039308.748, "dur": 0.246, "args": { "External id": 16934,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039309.859, "dur": 0.421, "args": { "External id": 16935,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039311.138, "dur": 0.230, "args": { "External id": 16936,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039314.273, "dur": 0.216, "args": { "External id": 16937,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039315.584, "dur": 0.204, "args": { "External id": 16938,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039316.786, "dur": 0.214, "args": { "External id": 16939,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039317.867, "dur": 0.200, "args": { "External id": 16940,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039318.822, "dur": 0.210, "args": { "External id": 16941,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039319.919, "dur": 0.202, "args": { "External id": 16942,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039321.095, "dur": 0.243, "args": { "External id": 16943,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039322.159, "dur": 0.195, "args": { "External id": 16944,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039325.049, "dur": 0.203, "args": { "External id": 16945,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039326.134, "dur": 0.231, "args": { "External id": 16946,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039327.436, "dur": 0.202, "args": { "External id": 16947,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039328.810, "dur": 0.215, "args": { "External id": 16948,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039329.726, "dur": 0.205, "args": { "External id": 16949,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039331.032, "dur": 0.206, "args": { "External id": 16950,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039332.245, "dur": 0.201, "args": { "External id": 16951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039333.385, "dur": 0.200, "args": { "External id": 16952,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039336.475, "dur": 0.202, "args": { "External id": 16953,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039337.586, "dur": 0.225, "args": { "External id": 16954,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039338.878, "dur": 0.236, "args": { "External id": 16955,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039339.974, "dur": 0.225, "args": { "External id": 16956,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039341.285, "dur": 0.209, "args": { "External id": 16957,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039342.225, "dur": 0.375, "args": { "External id": 16958,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039343.554, "dur": 0.202, "args": { "External id": 16959,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039344.632, "dur": 0.206, "args": { "External id": 16960,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039347.515, "dur": 0.496, "args": { "External id": 16961,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039348.917, "dur": 0.447, "args": { "External id": 16962,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039350.274, "dur": 0.227, "args": { "External id": 16963,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039351.542, "dur": 0.209, "args": { "External id": 16964,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039352.594, "dur": 0.217, "args": { "External id": 16965,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039353.774, "dur": 0.210, "args": { "External id": 16966,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039355.934, "dur": 0.216, "args": { "External id": 16967,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039357.075, "dur": 0.198, "args": { "External id": 16968,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039360.379, "dur": 0.208, "args": { "External id": 16969,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039361.657, "dur": 0.273, "args": { "External id": 16970,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039362.666, "dur": 0.206, "args": { "External id": 16971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039363.603, "dur": 0.237, "args": { "External id": 16972,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039364.613, "dur": 0.206, "args": { "External id": 16973,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039365.738, "dur": 0.204, "args": { "External id": 16974,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039366.816, "dur": 0.207, "args": { "External id": 16975,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039367.732, "dur": 0.206, "args": { "External id": 16976,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039371.169, "dur": 0.199, "args": { "External id": 16977,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039372.100, "dur": 0.467, "args": { "External id": 16978,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039373.280, "dur": 0.201, "args": { "External id": 16979,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039374.171, "dur": 0.204, "args": { "External id": 16980,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039375.086, "dur": 0.207, "args": { "External id": 16981,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039376.263, "dur": 0.461, "args": { "External id": 16982,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039377.426, "dur": 0.415, "args": { "External id": 16983,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039378.698, "dur": 0.411, "args": { "External id": 16984,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039382.000, "dur": 0.417, "args": { "External id": 16985,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039383.285, "dur": 0.435, "args": { "External id": 16986,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039384.656, "dur": 0.428, "args": { "External id": 16987,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039385.864, "dur": 0.405, "args": { "External id": 16988,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039386.959, "dur": 0.203, "args": { "External id": 16989,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039388.086, "dur": 0.415, "args": { "External id": 16990,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039389.209, "dur": 0.240, "args": { "External id": 16991,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039390.172, "dur": 0.202, "args": { "External id": 16992,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039393.272, "dur": 0.203, "args": { "External id": 16993,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039394.493, "dur": 0.204, "args": { "External id": 16994,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039395.595, "dur": 0.201, "args": { "External id": 16995,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039396.485, "dur": 0.199, "args": { "External id": 16996,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039397.562, "dur": 0.204, "args": { "External id": 16997,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039398.660, "dur": 0.201, "args": { "External id": 16998,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039400.595, "dur": 0.207, "args": { "External id": 16999,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039401.613, "dur": 0.198, "args": { "External id": 17000,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039404.649, "dur": 0.203, "args": { "External id": 17001,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039405.591, "dur": 0.207, "args": { "External id": 17002,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039406.555, "dur": 0.207, "args": { "External id": 17003,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039407.491, "dur": 0.431, "args": { "External id": 17004,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039408.695, "dur": 0.205, "args": { "External id": 17005,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039409.634, "dur": 0.204, "args": { "External id": 17006,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039410.574, "dur": 0.204, "args": { "External id": 17007,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039411.514, "dur": 0.206, "args": { "External id": 17008,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039414.593, "dur": 0.207, "args": { "External id": 17009,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039415.548, "dur": 0.200, "args": { "External id": 17010,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039416.449, "dur": 0.205, "args": { "External id": 17011,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039417.429, "dur": 0.205, "args": { "External id": 17012,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039418.331, "dur": 0.204, "args": { "External id": 17013,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039419.238, "dur": 0.204, "args": { "External id": 17014,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039420.996, "dur": 0.202, "args": { "External id": 17015,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039421.933, "dur": 0.204, "args": { "External id": 17016,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039425.001, "dur": 0.203, "args": { "External id": 17017,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039425.904, "dur": 0.204, "args": { "External id": 17018,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039426.806, "dur": 0.207, "args": { "External id": 17019,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039427.929, "dur": 0.206, "args": { "External id": 17020,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039428.842, "dur": 0.206, "args": { "External id": 17021,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039429.785, "dur": 0.197, "args": { "External id": 17022,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039430.705, "dur": 0.203, "args": { "External id": 17023,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039431.626, "dur": 0.203, "args": { "External id": 17024,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039434.409, "dur": 0.204, "args": { "External id": 17025,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039435.572, "dur": 0.207, "args": { "External id": 17026,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039436.539, "dur": 0.205, "args": { "External id": 17027,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039437.601, "dur": 0.207, "args": { "External id": 17028,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039438.605, "dur": 0.204, "args": { "External id": 17029,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039439.722, "dur": 0.209, "args": { "External id": 17030,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039441.140, "dur": 0.214, "args": { "External id": 17031,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039442.115, "dur": 0.204, "args": { "External id": 17032,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039445.475, "dur": 0.441, "args": { "External id": 17033,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039446.768, "dur": 0.412, "args": { "External id": 17034,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039447.892, "dur": 0.392, "args": { "External id": 17035,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039449.178, "dur": 0.412, "args": { "External id": 17036,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039450.449, "dur": 0.201, "args": { "External id": 17037,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039451.532, "dur": 0.386, "args": { "External id": 17038,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039452.791, "dur": 0.374, "args": { "External id": 17039,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039454.032, "dur": 0.553, "args": { "External id": 17040,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039457.359, "dur": 0.373, "args": { "External id": 17041,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039458.439, "dur": 0.205, "args": { "External id": 17042,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039459.398, "dur": 0.201, "args": { "External id": 17043,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039460.299, "dur": 0.202, "args": { "External id": 17044,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039461.271, "dur": 0.204, "args": { "External id": 17045,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039462.274, "dur": 0.205, "args": { "External id": 17046,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039463.213, "dur": 0.206, "args": { "External id": 17047,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039464.122, "dur": 0.210, "args": { "External id": 17048,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039466.886, "dur": 0.213, "args": { "External id": 17049,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039467.862, "dur": 0.205, "args": { "External id": 17050,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039468.985, "dur": 0.206, "args": { "External id": 17051,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039469.929, "dur": 0.205, "args": { "External id": 17052,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039470.862, "dur": 0.204, "args": { "External id": 17053,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039471.786, "dur": 0.200, "args": { "External id": 17054,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039472.697, "dur": 0.422, "args": { "External id": 17055,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039473.822, "dur": 0.377, "args": { "External id": 17056,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039476.697, "dur": 0.432, "args": { "External id": 17057,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039477.877, "dur": 0.393, "args": { "External id": 17058,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039478.964, "dur": 0.430, "args": { "External id": 17059,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039480.097, "dur": 0.220, "args": { "External id": 17060,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039481.029, "dur": 0.202, "args": { "External id": 17061,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039481.926, "dur": 0.396, "args": { "External id": 17062,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039483.039, "dur": 0.373, "args": { "External id": 17063,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039484.300, "dur": 0.395, "args": { "External id": 17064,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039487.326, "dur": 0.483, "args": { "External id": 17065,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039488.583, "dur": 0.201, "args": { "External id": 17066,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039489.557, "dur": 0.205, "args": { "External id": 17067,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039490.456, "dur": 0.203, "args": { "External id": 17068,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039491.345, "dur": 0.204, "args": { "External id": 17069,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039492.250, "dur": 0.204, "args": { "External id": 17070,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039493.564, "dur": 0.202, "args": { "External id": 17071,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039494.509, "dur": 0.217, "args": { "External id": 17072,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039497.208, "dur": 0.217, "args": { "External id": 17073,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039498.153, "dur": 0.203, "args": { "External id": 17074,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039499.084, "dur": 0.207, "args": { "External id": 17075,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039500.026, "dur": 0.203, "args": { "External id": 17076,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039500.955, "dur": 0.211, "args": { "External id": 17077,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039501.893, "dur": 0.200, "args": { "External id": 17078,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039503.036, "dur": 0.206, "args": { "External id": 17079,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039504.146, "dur": 0.200, "args": { "External id": 17080,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039508.281, "dur": 0.215, "args": { "External id": 17081,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039509.403, "dur": 0.203, "args": { "External id": 17082,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039510.372, "dur": 0.201, "args": { "External id": 17083,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039511.294, "dur": 0.201, "args": { "External id": 17084,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039512.215, "dur": 0.198, "args": { "External id": 17085,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039513.141, "dur": 0.202, "args": { "External id": 17086,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039514.080, "dur": 0.209, "args": { "External id": 17087,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039515.001, "dur": 0.203, "args": { "External id": 17088,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039517.813, "dur": 0.206, "args": { "External id": 17089,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039519.041, "dur": 0.210, "args": { "External id": 17090,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039520.168, "dur": 0.200, "args": { "External id": 17091,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039521.250, "dur": 0.203, "args": { "External id": 17092,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039522.148, "dur": 0.206, "args": { "External id": 17093,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039523.231, "dur": 0.207, "args": { "External id": 17094,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039524.748, "dur": 0.201, "args": { "External id": 17095,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039525.725, "dur": 0.202, "args": { "External id": 17096,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039528.559, "dur": 0.200, "args": { "External id": 17097,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039529.666, "dur": 0.204, "args": { "External id": 17098,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039530.614, "dur": 0.201, "args": { "External id": 17099,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039531.545, "dur": 0.201, "args": { "External id": 17100,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039532.446, "dur": 0.202, "args": { "External id": 17101,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039533.348, "dur": 0.209, "args": { "External id": 17102,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039534.282, "dur": 0.205, "args": { "External id": 17103,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039535.193, "dur": 0.207, "args": { "External id": 17104,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039538.268, "dur": 0.210, "args": { "External id": 17105,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039539.190, "dur": 0.196, "args": { "External id": 17106,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039540.133, "dur": 0.201, "args": { "External id": 17107,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039541.075, "dur": 0.197, "args": { "External id": 17108,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039542.007, "dur": 0.198, "args": { "External id": 17109,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039542.913, "dur": 0.200, "args": { "External id": 17110,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039543.820, "dur": 0.198, "args": { "External id": 17111,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039544.731, "dur": 0.202, "args": { "External id": 17112,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039547.128, "dur": 0.445, "args": { "External id": 17113,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039548.279, "dur": 0.409, "args": { "External id": 17114,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039549.433, "dur": 0.400, "args": { "External id": 17115,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039550.553, "dur": 0.446, "args": { "External id": 17116,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039551.745, "dur": 0.200, "args": { "External id": 17117,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039552.692, "dur": 0.400, "args": { "External id": 17118,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039553.837, "dur": 0.398, "args": { "External id": 17119,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039554.939, "dur": 0.377, "args": { "External id": 17120,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039557.612, "dur": 0.218, "args": { "External id": 17121,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039558.752, "dur": 0.413, "args": { "External id": 17122,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039560.272, "dur": 0.207, "args": { "External id": 17123,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039561.200, "dur": 0.205, "args": { "External id": 17124,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039562.262, "dur": 0.204, "args": { "External id": 17125,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039563.178, "dur": 0.202, "args": { "External id": 17126,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039564.277, "dur": 0.201, "args": { "External id": 17127,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039565.210, "dur": 0.447, "args": { "External id": 17128,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039568.408, "dur": 0.409, "args": { "External id": 17129,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039569.570, "dur": 0.398, "args": { "External id": 17130,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039570.670, "dur": 0.416, "args": { "External id": 17131,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039572.003, "dur": 0.414, "args": { "External id": 17132,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039573.130, "dur": 0.207, "args": { "External id": 17133,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039574.225, "dur": 0.416, "args": { "External id": 17134,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039575.521, "dur": 0.404, "args": { "External id": 17135,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039576.648, "dur": 0.373, "args": { "External id": 17136,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039579.891, "dur": 0.208, "args": { "External id": 17137,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039580.810, "dur": 0.202, "args": { "External id": 17138,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039581.745, "dur": 0.209, "args": { "External id": 17139,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10634 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039582.662, "dur": 0.202, "args": { "External id": 17140,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10635 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039583.581, "dur": 0.204, "args": { "External id": 17141,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10636 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039584.558, "dur": 0.200, "args": { "External id": 17142,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10637 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039585.468, "dur": 0.204, "args": { "External id": 17143,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10638 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039586.377, "dur": 0.205, "args": { "External id": 17144,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10639 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039589.357, "dur": 0.207, "args": { "External id": 17145,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10640 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039590.266, "dur": 0.204, "args": { "External id": 17146,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10641 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039591.206, "dur": 0.201, "args": { "External id": 17147,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10642 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039592.121, "dur": 0.208, "args": { "External id": 17148,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10643 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039593.020, "dur": 0.200, "args": { "External id": 17149,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10644 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039594.003, "dur": 0.354, "args": { "External id": 17150,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10645 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039595.275, "dur": 0.362, "args": { "External id": 17151,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10646 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039596.566, "dur": 0.204, "args": { "External id": 17152,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10647 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039600.333, "dur": 0.204, "args": { "External id": 17153,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10648 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039601.248, "dur": 0.208, "args": { "External id": 17154,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10649 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039602.623, "dur": 0.207, "args": { "External id": 17155,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10650 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039603.541, "dur": 0.241, "args": { "External id": 17156,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10651 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039604.494, "dur": 0.204, "args": { "External id": 17157,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10652 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039605.453, "dur": 0.199, "args": { "External id": 17158,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10653 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039606.387, "dur": 0.202, "args": { "External id": 17159,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10654 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039607.314, "dur": 0.200, "args": { "External id": 17160,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10655 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039609.963, "dur": 0.202, "args": { "External id": 17161,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10656 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039610.914, "dur": 0.200, "args": { "External id": 17162,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10657 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039611.878, "dur": 0.205, "args": { "External id": 17163,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10658 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039612.796, "dur": 0.200, "args": { "External id": 17164,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10659 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039613.690, "dur": 0.204, "args": { "External id": 17165,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10660 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039614.829, "dur": 0.197, "args": { "External id": 17166,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10661 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039615.719, "dur": 0.202, "args": { "External id": 17167,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10662 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039616.895, "dur": 0.196, "args": { "External id": 17168,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10663 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039620.082, "dur": 0.204, "args": { "External id": 17169,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10664 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039621.005, "dur": 0.203, "args": { "External id": 17170,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10665 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039622.087, "dur": 0.207, "args": { "External id": 17171,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10666 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039623.007, "dur": 0.202, "args": { "External id": 17172,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10667 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039623.922, "dur": 0.201, "args": { "External id": 17173,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10668 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039624.836, "dur": 0.202, "args": { "External id": 17174,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10669 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039625.732, "dur": 0.203, "args": { "External id": 17175,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10670 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039626.636, "dur": 0.205, "args": { "External id": 17176,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10671 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039629.603, "dur": 0.206, "args": { "External id": 17177,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10672 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039634.953, "dur": 0.268, "args": { "External id": 17178,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10673 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039636.048, "dur": 0.207, "args": { "External id": 17179,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10674 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039637.054, "dur": 0.207, "args": { "External id": 17180,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10675 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039638.028, "dur": 0.204, "args": { "External id": 17181,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10676 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039639.003, "dur": 0.199, "args": { "External id": 17182,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10677 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039639.958, "dur": 0.198, "args": { "External id": 17183,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10678 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039640.864, "dur": 0.207, "args": { "External id": 17184,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10679 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039644.008, "dur": 0.405, "args": { "External id": 17185,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10680 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039645.281, "dur": 0.408, "args": { "External id": 17186,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10681 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039646.427, "dur": 0.418, "args": { "External id": 17187,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10682 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039647.541, "dur": 0.388, "args": { "External id": 17188,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10683 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039648.662, "dur": 0.202, "args": { "External id": 17189,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10684 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039649.642, "dur": 0.379, "args": { "External id": 17190,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10685 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039651.212, "dur": 0.533, "args": { "External id": 17191,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10686 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039652.476, "dur": 0.408, "args": { "External id": 17192,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10687 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039655.174, "dur": 0.420, "args": { "External id": 17193,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10688 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039656.495, "dur": 0.419, "args": { "External id": 17194,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10689 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039659.127, "dur": 0.218, "args": { "External id": 17195,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10690 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039660.307, "dur": 0.202, "args": { "External id": 17196,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10691 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039661.210, "dur": 0.198, "args": { "External id": 17197,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10692 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039662.122, "dur": 0.202, "args": { "External id": 17198,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10693 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039663.127, "dur": 0.208, "args": { "External id": 17199,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10694 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039664.224, "dur": 0.194, "args": { "External id": 17200,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10695 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039666.795, "dur": 0.428, "args": { "External id": 17201,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10696 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039668.201, "dur": 0.375, "args": { "External id": 17202,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10697 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039669.435, "dur": 0.395, "args": { "External id": 17203,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10698 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039670.722, "dur": 0.505, "args": { "External id": 17204,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10699 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039672.131, "dur": 0.198, "args": { "External id": 17205,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10700 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039673.056, "dur": 0.377, "args": { "External id": 17206,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10701 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039674.379, "dur": 0.399, "args": { "External id": 17207,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10702 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039675.659, "dur": 0.400, "args": { "External id": 17208,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10703 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039678.656, "dur": 0.403, "args": { "External id": 17209,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10704 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039680.033, "dur": 0.201, "args": { "External id": 17210,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10705 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039680.925, "dur": 0.202, "args": { "External id": 17211,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10706 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652039682.015, "dur": 0.197, "args": { "External id": 17212,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 10707 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336754, "tid": 1336754, "ts": 1295652039737.143, "dur": 1575.247, "args": { "External id": 17213,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10708 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::stack", "pid": 1336754, "tid": 1336754, "ts": 1295652040210.988, "dur": 1007.633, "args": { "External id": 17214,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10709 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040219.052, "dur": 8.203, "args": { "External id": 17215,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10710 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040223.344, "dur": 3.219, "args": { "External id": 17216,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10711 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040228.023, "dur": 14.407, "args": { "External id": 17217,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10712 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040239.614, "dur": 2.459, "args": { "External id": 17218,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10713 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040243.150, "dur": 3.423, "args": { "External id": 17219,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10714 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040246.066, "dur": 0.421, "args": { "External id": 17220,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10715 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040247.052, "dur": 1.450, "args": { "External id": 17221,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10716 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040247.936, "dur": 0.496, "args": { "External id": 17222,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10717 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040251.004, "dur": 4.816, "args": { "External id": 17223,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10718 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040255.333, "dur": 0.420, "args": { "External id": 17224,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10719 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040256.165, "dur": 2.202, "args": { "External id": 17225,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10720 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040257.098, "dur": 1.191, "args": { "External id": 17226,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10721 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040258.613, "dur": 1.098, "args": { "External id": 17227,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10722 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040258.972, "dur": 0.669, "args": { "External id": 17228,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10723 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040259.933, "dur": 3.711, "args": { "External id": 17229,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10724 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040263.083, "dur": 0.485, "args": { "External id": 17230,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10725 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040263.865, "dur": 1.067, "args": { "External id": 17231,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10726 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040264.483, "dur": 0.388, "args": { "External id": 17232,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10727 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040265.158, "dur": 2.948, "args": { "External id": 17233,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10728 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040265.842, "dur": 2.186, "args": { "External id": 17234,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10729 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040268.575, "dur": 3.132, "args": { "External id": 17235,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10730 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040270.818, "dur": 0.819, "args": { "External id": 17236,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10731 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040272.333, "dur": 1.421, "args": { "External id": 17237,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10732 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040273.204, "dur": 0.488, "args": { "External id": 17238,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10733 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040276.066, "dur": 4.467, "args": { "External id": 17239,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10734 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040280.145, "dur": 0.319, "args": { "External id": 17240,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10735 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040281.018, "dur": 1.298, "args": { "External id": 17241,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10736 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040281.585, "dur": 0.656, "args": { "External id": 17242,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10737 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040282.977, "dur": 1.169, "args": { "External id": 17243,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10738 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040283.543, "dur": 0.530, "args": { "External id": 17244,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10739 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040284.540, "dur": 3.711, "args": { "External id": 17245,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10740 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040287.646, "dur": 0.538, "args": { "External id": 17246,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10741 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040288.653, "dur": 1.464, "args": { "External id": 17247,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10742 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040289.348, "dur": 0.696, "args": { "External id": 17248,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10743 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040290.516, "dur": 3.613, "args": { "External id": 17249,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10744 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040291.270, "dur": 2.707, "args": { "External id": 17250,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10745 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040294.583, "dur": 2.162, "args": { "External id": 17251,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10746 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040296.065, "dur": 0.613, "args": { "External id": 17252,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10747 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040297.134, "dur": 1.713, "args": { "External id": 17253,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10748 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040297.914, "dur": 0.849, "args": { "External id": 17254,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10749 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040300.732, "dur": 4.064, "args": { "External id": 17255,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10750 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040304.276, "dur": 0.449, "args": { "External id": 17256,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10751 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040305.071, "dur": 1.236, "args": { "External id": 17257,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10752 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040305.731, "dur": 0.512, "args": { "External id": 17258,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10753 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040306.743, "dur": 1.415, "args": { "External id": 17259,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10754 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040307.357, "dur": 0.738, "args": { "External id": 17260,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10755 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040308.597, "dur": 3.359, "args": { "External id": 17261,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10756 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040311.590, "dur": 0.300, "args": { "External id": 17262,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10757 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040312.374, "dur": 1.189, "args": { "External id": 17263,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10758 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040312.784, "dur": 0.716, "args": { "External id": 17264,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10759 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040313.783, "dur": 2.726, "args": { "External id": 17265,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10760 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040314.164, "dur": 2.065, "args": { "External id": 17266,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10761 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040316.807, "dur": 2.393, "args": { "External id": 17267,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10762 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040318.657, "dur": 0.478, "args": { "External id": 17268,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10763 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040319.418, "dur": 1.433, "args": { "External id": 17269,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10764 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040319.792, "dur": 0.992, "args": { "External id": 17270,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10765 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040323.306, "dur": 5.157, "args": { "External id": 17271,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10766 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040327.524, "dur": 0.875, "args": { "External id": 17272,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10767 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040328.811, "dur": 1.867, "args": { "External id": 17273,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10768 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040329.596, "dur": 1.011, "args": { "External id": 17274,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10769 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040331.092, "dur": 1.376, "args": { "External id": 17275,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10770 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040331.695, "dur": 0.696, "args": { "External id": 17276,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10771 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040332.998, "dur": 4.015, "args": { "External id": 17277,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10772 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040336.104, "dur": 0.840, "args": { "External id": 17278,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10773 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040337.450, "dur": 1.323, "args": { "External id": 17279,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10774 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040337.988, "dur": 0.711, "args": { "External id": 17280,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10775 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040338.993, "dur": 3.034, "args": { "External id": 17281,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10776 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040339.484, "dur": 2.475, "args": { "External id": 17282,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10777 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040342.282, "dur": 4.052, "args": { "External id": 17283,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10778 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040345.871, "dur": 0.400, "args": { "External id": 17284,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10779 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040346.795, "dur": 3.109, "args": { "External id": 17285,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10780 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040347.281, "dur": 2.374, "args": { "External id": 17286,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10781 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040352.099, "dur": 3.114, "args": { "External id": 17287,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10782 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040354.346, "dur": 0.798, "args": { "External id": 17288,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10783 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040355.431, "dur": 1.764, "args": { "External id": 17289,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10784 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040355.847, "dur": 1.280, "args": { "External id": 17290,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10785 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040357.415, "dur": 3.185, "args": { "External id": 17291,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10786 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040359.949, "dur": 0.584, "args": { "External id": 17292,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10787 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040361.057, "dur": 1.979, "args": { "External id": 17293,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10788 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040362.567, "dur": 0.400, "args": { "External id": 17294,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10789 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040363.426, "dur": 1.506, "args": { "External id": 17295,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10790 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040364.189, "dur": 0.669, "args": { "External id": 17296,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10791 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040365.400, "dur": 3.884, "args": { "External id": 17297,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10792 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040368.320, "dur": 0.896, "args": { "External id": 17298,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10793 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040369.513, "dur": 1.436, "args": { "External id": 17299,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10794 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040370.194, "dur": 0.688, "args": { "External id": 17300,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10795 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040371.167, "dur": 2.921, "args": { "External id": 17301,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10796 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040371.563, "dur": 2.445, "args": { "External id": 17302,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10797 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040376.299, "dur": 1.612, "args": { "External id": 17303,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10798 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040377.433, "dur": 0.401, "args": { "External id": 17304,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10799 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040378.316, "dur": 1.199, "args": { "External id": 17305,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10800 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040378.817, "dur": 0.622, "args": { "External id": 17306,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10801 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040379.733, "dur": 3.122, "args": { "External id": 17307,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10802 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040382.346, "dur": 0.440, "args": { "External id": 17308,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10803 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040383.137, "dur": 1.407, "args": { "External id": 17309,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10804 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040383.895, "dur": 0.580, "args": { "External id": 17310,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10805 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040384.799, "dur": 1.405, "args": { "External id": 17311,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10806 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040385.572, "dur": 0.568, "args": { "External id": 17312,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10807 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040386.592, "dur": 3.368, "args": { "External id": 17313,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10808 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040389.442, "dur": 0.444, "args": { "External id": 17314,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10809 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040390.556, "dur": 1.476, "args": { "External id": 17315,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10810 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040391.399, "dur": 0.563, "args": { "External id": 17316,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10811 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040392.342, "dur": 2.639, "args": { "External id": 17317,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10812 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040392.821, "dur": 2.089, "args": { "External id": 17318,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10813 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040397.345, "dur": 1.304, "args": { "External id": 17319,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10814 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040398.078, "dur": 0.507, "args": { "External id": 17320,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10815 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040398.923, "dur": 1.023, "args": { "External id": 17321,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10816 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040399.402, "dur": 0.481, "args": { "External id": 17322,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10817 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040400.191, "dur": 3.537, "args": { "External id": 17323,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10818 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040403.181, "dur": 0.483, "args": { "External id": 17324,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10819 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040404.006, "dur": 1.926, "args": { "External id": 17325,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10820 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040405.283, "dur": 0.568, "args": { "External id": 17326,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10821 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040406.386, "dur": 1.431, "args": { "External id": 17327,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10822 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040407.165, "dur": 0.578, "args": { "External id": 17328,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10823 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040408.257, "dur": 3.182, "args": { "External id": 17329,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10824 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040410.869, "dur": 0.495, "args": { "External id": 17330,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10825 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040412.057, "dur": 1.528, "args": { "External id": 17331,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10826 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040412.758, "dur": 0.759, "args": { "External id": 17332,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10827 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040413.809, "dur": 3.026, "args": { "External id": 17333,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10828 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040414.170, "dur": 2.412, "args": { "External id": 17334,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10829 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040419.223, "dur": 1.744, "args": { "External id": 17335,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10830 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040419.916, "dur": 0.983, "args": { "External id": 17336,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10831 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040421.295, "dur": 1.322, "args": { "External id": 17337,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10832 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040421.872, "dur": 0.677, "args": { "External id": 17338,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10833 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040422.846, "dur": 3.117, "args": { "External id": 17339,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10834 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040425.255, "dur": 0.642, "args": { "External id": 17340,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10835 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040426.210, "dur": 1.716, "args": { "External id": 17341,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10836 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040427.130, "dur": 0.725, "args": { "External id": 17342,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10837 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040428.350, "dur": 1.542, "args": { "External id": 17343,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10838 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040428.915, "dur": 0.908, "args": { "External id": 17344,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10839 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040430.133, "dur": 3.223, "args": { "External id": 17345,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10840 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040432.515, "dur": 0.777, "args": { "External id": 17346,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10841 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040433.577, "dur": 1.284, "args": { "External id": 17347,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10842 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040434.412, "dur": 0.383, "args": { "External id": 17348,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10843 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040435.117, "dur": 2.749, "args": { "External id": 17349,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10844 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040435.599, "dur": 2.193, "args": { "External id": 17350,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10845 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040440.296, "dur": 1.770, "args": { "External id": 17351,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10846 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040441.005, "dur": 0.993, "args": { "External id": 17352,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10847 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040442.485, "dur": 1.337, "args": { "External id": 17353,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10848 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040443.256, "dur": 0.496, "args": { "External id": 17354,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10849 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040444.258, "dur": 2.793, "args": { "External id": 17355,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10850 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040446.672, "dur": 0.310, "args": { "External id": 17356,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10851 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040447.296, "dur": 1.550, "args": { "External id": 17357,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10852 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040448.275, "dur": 0.505, "args": { "External id": 17358,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10853 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040449.069, "dur": 1.226, "args": { "External id": 17359,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10854 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040449.693, "dur": 0.535, "args": { "External id": 17360,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10855 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040450.903, "dur": 3.444, "args": { "External id": 17361,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10856 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040453.736, "dur": 0.543, "args": { "External id": 17362,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10857 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040454.573, "dur": 1.515, "args": { "External id": 17363,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10858 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040455.600, "dur": 0.420, "args": { "External id": 17364,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10859 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040456.656, "dur": 3.265, "args": { "External id": 17365,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10860 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040457.251, "dur": 2.418, "args": { "External id": 17366,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10861 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040461.741, "dur": 1.075, "args": { "External id": 17367,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10862 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040462.428, "dur": 0.318, "args": { "External id": 17368,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10863 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040463.260, "dur": 0.971, "args": { "External id": 17369,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10864 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040463.696, "dur": 0.469, "args": { "External id": 17370,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10865 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040464.454, "dur": 2.937, "args": { "External id": 17371,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10866 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040466.905, "dur": 0.421, "args": { "External id": 17372,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10867 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040467.638, "dur": 1.478, "args": { "External id": 17373,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10868 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040468.617, "dur": 0.430, "args": { "External id": 17374,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10869 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040469.337, "dur": 1.019, "args": { "External id": 17375,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10870 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040469.726, "dur": 0.567, "args": { "External id": 17376,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10871 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040470.627, "dur": 3.570, "args": { "External id": 17377,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10872 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040473.286, "dur": 0.849, "args": { "External id": 17378,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10873 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040474.796, "dur": 1.855, "args": { "External id": 17379,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10874 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040475.827, "dur": 0.755, "args": { "External id": 17380,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10875 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040477.047, "dur": 2.950, "args": { "External id": 17381,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10876 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040477.630, "dur": 2.297, "args": { "External id": 17382,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10877 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040482.239, "dur": 1.100, "args": { "External id": 17383,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10878 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040483.047, "dur": 0.227, "args": { "External id": 17384,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10879 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040483.569, "dur": 1.138, "args": { "External id": 17385,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10880 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040483.949, "dur": 0.687, "args": { "External id": 17386,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10881 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040484.951, "dur": 3.099, "args": { "External id": 17387,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10882 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040487.496, "dur": 0.485, "args": { "External id": 17388,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10883 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040488.299, "dur": 1.740, "args": { "External id": 17389,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10884 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040489.161, "dur": 0.809, "args": { "External id": 17390,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10885 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040490.512, "dur": 1.334, "args": { "External id": 17391,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10886 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040491.069, "dur": 0.713, "args": { "External id": 17392,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10887 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040492.081, "dur": 3.572, "args": { "External id": 17393,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10888 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040494.772, "dur": 0.816, "args": { "External id": 17394,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10889 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040496.051, "dur": 1.464, "args": { "External id": 17395,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10890 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040496.783, "dur": 0.665, "args": { "External id": 17396,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10891 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040497.904, "dur": 3.414, "args": { "External id": 17397,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10892 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040498.665, "dur": 2.579, "args": { "External id": 17398,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10893 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040503.456, "dur": 1.343, "args": { "External id": 17399,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10894 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040504.099, "dur": 0.632, "args": { "External id": 17400,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10895 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040505.020, "dur": 1.575, "args": { "External id": 17401,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10896 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040505.410, "dur": 1.119, "args": { "External id": 17402,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10897 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040507.001, "dur": 2.729, "args": { "External id": 17403,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10898 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040509.396, "dur": 0.267, "args": { "External id": 17404,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10899 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040509.981, "dur": 1.445, "args": { "External id": 17405,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10900 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040510.816, "dur": 0.541, "args": { "External id": 17406,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10901 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040511.832, "dur": 1.086, "args": { "External id": 17407,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10902 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040512.349, "dur": 0.503, "args": { "External id": 17408,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10903 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040539.475, "dur": 3.902, "args": { "External id": 23553,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10904 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040541.901, "dur": 1.402, "args": { "External id": 23554,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10905 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040543.641, "dur": 1.295, "args": { "External id": 23555,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10906 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040544.460, "dur": 0.403, "args": { "External id": 23556,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10907 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040545.163, "dur": 3.382, "args": { "External id": 23557,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10908 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040545.531, "dur": 2.939, "args": { "External id": 23558,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10909 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040550.670, "dur": 1.051, "args": { "External id": 23559,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10910 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040551.145, "dur": 0.504, "args": { "External id": 23560,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10911 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040551.960, "dur": 1.545, "args": { "External id": 23561,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10912 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040553.018, "dur": 0.418, "args": { "External id": 23562,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10913 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040553.935, "dur": 3.676, "args": { "External id": 23563,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10914 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040556.747, "dur": 0.796, "args": { "External id": 23564,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10915 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040557.891, "dur": 1.303, "args": { "External id": 23565,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10916 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040558.874, "dur": 0.253, "args": { "External id": 23566,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10917 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040559.456, "dur": 1.656, "args": { "External id": 23567,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10918 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040560.478, "dur": 0.569, "args": { "External id": 23568,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10919 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040561.562, "dur": 3.287, "args": { "External id": 23569,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10920 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040564.379, "dur": 0.403, "args": { "External id": 23570,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10921 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040565.105, "dur": 1.173, "args": { "External id": 23571,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10922 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040565.915, "dur": 0.296, "args": { "External id": 23572,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10923 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040566.518, "dur": 2.916, "args": { "External id": 23573,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10924 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040567.187, "dur": 2.176, "args": { "External id": 23574,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10925 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040571.301, "dur": 1.106, "args": { "External id": 23575,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10926 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040572.034, "dur": 0.303, "args": { "External id": 23576,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10927 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040572.855, "dur": 1.397, "args": { "External id": 23577,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10928 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040573.755, "dur": 0.425, "args": { "External id": 23578,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10929 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040574.494, "dur": 2.785, "args": { "External id": 23579,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10930 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040576.791, "dur": 0.420, "args": { "External id": 23580,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10931 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040577.542, "dur": 1.607, "args": { "External id": 23581,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10932 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040578.564, "dur": 0.518, "args": { "External id": 23582,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10933 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040579.391, "dur": 1.156, "args": { "External id": 23583,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10934 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040580.131, "dur": 0.348, "args": { "External id": 23584,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10935 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040580.789, "dur": 3.000, "args": { "External id": 23585,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10936 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040583.402, "dur": 0.320, "args": { "External id": 23586,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10937 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040584.031, "dur": 1.060, "args": { "External id": 23587,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10938 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040584.721, "dur": 0.304, "args": { "External id": 23588,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10939 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040585.382, "dur": 2.867, "args": { "External id": 23589,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10940 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040585.848, "dur": 2.232, "args": { "External id": 23590,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10941 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040590.801, "dur": 1.046, "args": { "External id": 23591,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10942 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040591.326, "dur": 0.452, "args": { "External id": 23592,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10943 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040592.273, "dur": 0.912, "args": { "External id": 23593,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10944 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040592.736, "dur": 0.378, "args": { "External id": 23594,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10945 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040593.646, "dur": 3.494, "args": { "External id": 23595,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10946 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040596.653, "dur": 0.417, "args": { "External id": 23596,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10947 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040597.405, "dur": 0.911, "args": { "External id": 23597,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10948 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040597.879, "dur": 0.371, "args": { "External id": 23598,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10949 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040598.557, "dur": 1.276, "args": { "External id": 23599,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10950 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040599.213, "dur": 0.552, "args": { "External id": 23600,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10951 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040600.280, "dur": 3.244, "args": { "External id": 23601,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10952 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040602.984, "dur": 0.474, "args": { "External id": 23602,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10953 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040603.769, "dur": 0.875, "args": { "External id": 23603,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10954 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040604.245, "dur": 0.330, "args": { "External id": 23604,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10955 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040604.884, "dur": 2.636, "args": { "External id": 23605,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10956 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040605.306, "dur": 2.140, "args": { "External id": 23606,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10957 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040609.306, "dur": 0.916, "args": { "External id": 23607,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10958 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040609.868, "dur": 0.280, "args": { "External id": 23608,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10959 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040610.564, "dur": 1.043, "args": { "External id": 23609,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10960 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040611.031, "dur": 0.511, "args": { "External id": 23610,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10961 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040612.018, "dur": 2.871, "args": { "External id": 23611,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10962 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040614.461, "dur": 0.363, "args": { "External id": 23612,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10963 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040615.173, "dur": 0.832, "args": { "External id": 23613,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10964 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040615.655, "dur": 0.283, "args": { "External id": 23614,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10965 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040616.268, "dur": 0.932, "args": { "External id": 23615,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10966 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040616.692, "dur": 0.440, "args": { "External id": 23616,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10967 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040617.473, "dur": 2.613, "args": { "External id": 23617,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10968 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040619.743, "dur": 0.279, "args": { "External id": 23618,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10969 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040620.326, "dur": 1.027, "args": { "External id": 23619,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10970 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040620.786, "dur": 0.506, "args": { "External id": 23620,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10971 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040621.595, "dur": 2.789, "args": { "External id": 23621,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10972 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040622.075, "dur": 2.238, "args": { "External id": 23622,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10973 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040626.458, "dur": 0.860, "args": { "External id": 23623,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10974 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040626.925, "dur": 0.328, "args": { "External id": 23624,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10975 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040627.674, "dur": 1.065, "args": { "External id": 23625,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10976 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040628.137, "dur": 0.534, "args": { "External id": 23626,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10977 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040629.198, "dur": 3.222, "args": { "External id": 23627,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10978 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040631.753, "dur": 0.602, "args": { "External id": 23628,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10979 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040632.721, "dur": 0.815, "args": { "External id": 23629,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10980 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040633.194, "dur": 0.276, "args": { "External id": 23630,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10981 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040633.778, "dur": 1.031, "args": { "External id": 23631,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10982 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040634.222, "dur": 0.522, "args": { "External id": 23632,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10983 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040635.145, "dur": 3.106, "args": { "External id": 23633,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10984 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040637.851, "dur": 0.334, "args": { "External id": 23634,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10985 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040638.491, "dur": 1.044, "args": { "External id": 23635,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10986 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040639.113, "dur": 0.356, "args": { "External id": 23636,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10987 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040639.771, "dur": 2.873, "args": { "External id": 23637,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10988 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040640.282, "dur": 2.291, "args": { "External id": 23638,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10989 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040644.778, "dur": 0.835, "args": { "External id": 23639,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10990 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040645.211, "dur": 0.337, "args": { "External id": 23640,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10991 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040645.855, "dur": 0.830, "args": { "External id": 23641,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10992 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040646.306, "dur": 0.316, "args": { "External id": 23642,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10993 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040647.171, "dur": 3.251, "args": { "External id": 23643,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10994 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040650.078, "dur": 0.279, "args": { "External id": 23644,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10995 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040650.688, "dur": 1.035, "args": { "External id": 23645,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10996 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040651.262, "dur": 0.394, "args": { "External id": 23646,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10997 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040651.975, "dur": 0.929, "args": { "External id": 23647,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 10998 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040652.470, "dur": 0.367, "args": { "External id": 23648,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 10999 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040653.145, "dur": 3.063, "args": { "External id": 23649,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11000 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040655.836, "dur": 0.306, "args": { "External id": 23650,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11001 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040656.461, "dur": 0.951, "args": { "External id": 23651,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11002 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040657.041, "dur": 0.308, "args": { "External id": 23652,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11003 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040657.670, "dur": 2.778, "args": { "External id": 23653,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11004 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040658.235, "dur": 2.143, "args": { "External id": 23654,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11005 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040662.543, "dur": 0.977, "args": { "External id": 23655,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11006 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040663.187, "dur": 0.270, "args": { "External id": 23656,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11007 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040663.761, "dur": 0.842, "args": { "External id": 23657,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11008 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040664.212, "dur": 0.323, "args": { "External id": 23658,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11009 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040664.847, "dur": 3.602, "args": { "External id": 23659,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11010 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040668.092, "dur": 0.283, "args": { "External id": 23660,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11011 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040668.756, "dur": 0.918, "args": { "External id": 23661,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11012 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040669.277, "dur": 0.333, "args": { "External id": 23662,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11013 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040670.114, "dur": 0.881, "args": { "External id": 23663,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11014 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040670.611, "dur": 0.321, "args": { "External id": 23664,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11015 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040671.235, "dur": 3.025, "args": { "External id": 23665,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11016 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040673.751, "dur": 0.440, "args": { "External id": 23666,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11017 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040674.500, "dur": 1.004, "args": { "External id": 23667,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11018 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040675.102, "dur": 0.338, "args": { "External id": 23668,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11019 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040675.749, "dur": 3.026, "args": { "External id": 23669,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11020 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040676.453, "dur": 2.251, "args": { "External id": 23670,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11021 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040681.002, "dur": 0.873, "args": { "External id": 23671,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11022 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040681.495, "dur": 0.311, "args": { "External id": 23672,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11023 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040682.114, "dur": 1.004, "args": { "External id": 23673,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11024 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040682.559, "dur": 0.491, "args": { "External id": 23674,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11025 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040683.544, "dur": 3.176, "args": { "External id": 23675,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11026 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040686.293, "dur": 0.360, "args": { "External id": 23676,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11027 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040687.017, "dur": 0.811, "args": { "External id": 23677,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11028 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040687.455, "dur": 0.311, "args": { "External id": 23678,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11029 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040688.068, "dur": 0.845, "args": { "External id": 23679,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11030 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040688.489, "dur": 0.360, "args": { "External id": 23680,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11031 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040689.384, "dur": 2.964, "args": { "External id": 23681,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11032 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040691.977, "dur": 0.309, "args": { "External id": 23682,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11033 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040692.588, "dur": 2.565, "args": { "External id": 23683,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11034 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040694.773, "dur": 0.313, "args": { "External id": 23684,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11035 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040695.395, "dur": 3.200, "args": { "External id": 23685,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11036 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040695.844, "dur": 2.498, "args": { "External id": 23686,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11037 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040700.724, "dur": 1.110, "args": { "External id": 23687,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11038 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040701.161, "dur": 0.610, "args": { "External id": 23688,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11039 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040702.075, "dur": 1.166, "args": { "External id": 23689,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11040 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040702.774, "dur": 0.402, "args": { "External id": 23690,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11041 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040703.497, "dur": 2.937, "args": { "External id": 23691,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11042 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040706.068, "dur": 0.298, "args": { "External id": 23692,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11043 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040706.697, "dur": 0.838, "args": { "External id": 23693,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11044 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040707.134, "dur": 0.335, "args": { "External id": 23694,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11045 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040707.805, "dur": 1.135, "args": { "External id": 23695,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11046 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040708.468, "dur": 0.397, "args": { "External id": 23696,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11047 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040709.188, "dur": 2.963, "args": { "External id": 23697,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11048 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040711.782, "dur": 0.300, "args": { "External id": 23698,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11049 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040712.614, "dur": 0.892, "args": { "External id": 23699,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11050 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040713.052, "dur": 0.382, "args": { "External id": 23700,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11051 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040713.758, "dur": 2.883, "args": { "External id": 23701,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11052 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040714.180, "dur": 2.194, "args": { "External id": 23702,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11053 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040718.914, "dur": 0.863, "args": { "External id": 23703,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11054 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040719.428, "dur": 0.282, "args": { "External id": 23704,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11055 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040720.334, "dur": 0.890, "args": { "External id": 23705,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11056 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040720.804, "dur": 0.356, "args": { "External id": 23706,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11057 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040721.466, "dur": 2.815, "args": { "External id": 23707,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11058 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040723.892, "dur": 0.322, "args": { "External id": 23708,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11059 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040724.545, "dur": 0.783, "args": { "External id": 23709,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11060 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040725.000, "dur": 0.261, "args": { "External id": 23710,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11061 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040725.572, "dur": 1.112, "args": { "External id": 23711,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11062 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040726.182, "dur": 0.431, "args": { "External id": 23712,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11063 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040726.945, "dur": 3.463, "args": { "External id": 23713,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11064 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040729.937, "dur": 0.403, "args": { "External id": 23714,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11065 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040730.857, "dur": 0.804, "args": { "External id": 23715,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11066 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040731.319, "dur": 0.280, "args": { "External id": 23716,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11067 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040731.902, "dur": 2.639, "args": { "External id": 23717,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11068 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040732.413, "dur": 2.055, "args": { "External id": 23718,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11069 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040736.851, "dur": 0.832, "args": { "External id": 23719,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11070 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040737.310, "dur": 0.307, "args": { "External id": 23720,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11071 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040738.146, "dur": 1.293, "args": { "External id": 23721,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11072 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040739.017, "dur": 0.358, "args": { "External id": 23722,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11073 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040739.681, "dur": 2.763, "args": { "External id": 23723,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11074 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040742.099, "dur": 0.277, "args": { "External id": 23724,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11075 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040742.719, "dur": 0.813, "args": { "External id": 23725,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11076 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040743.204, "dur": 0.264, "args": { "External id": 23726,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11077 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040743.797, "dur": 0.982, "args": { "External id": 23727,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11078 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040744.246, "dur": 0.464, "args": { "External id": 23728,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11079 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040745.021, "dur": 2.704, "args": { "External id": 23729,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11080 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040747.372, "dur": 0.286, "args": { "External id": 23730,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11081 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040748.193, "dur": 0.969, "args": { "External id": 23731,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11082 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040748.670, "dur": 0.422, "args": { "External id": 23732,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11083 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040749.414, "dur": 2.981, "args": { "External id": 23733,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11084 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040749.854, "dur": 2.473, "args": { "External id": 23734,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11085 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040754.325, "dur": 0.941, "args": { "External id": 23735,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11086 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040754.785, "dur": 0.416, "args": { "External id": 23736,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11087 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040755.724, "dur": 0.795, "args": { "External id": 23737,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11088 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040756.167, "dur": 0.287, "args": { "External id": 23738,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11089 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040756.801, "dur": 2.808, "args": { "External id": 23739,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11090 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040759.307, "dur": 0.239, "args": { "External id": 23740,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11091 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040759.876, "dur": 0.754, "args": { "External id": 23741,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11092 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040760.327, "dur": 0.238, "args": { "External id": 23742,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11093 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040760.879, "dur": 0.803, "args": { "External id": 23743,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11094 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040761.331, "dur": 0.287, "args": { "External id": 23744,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11095 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040762.023, "dur": 2.628, "args": { "External id": 23745,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11096 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040764.338, "dur": 0.250, "args": { "External id": 23746,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11097 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040764.901, "dur": 0.918, "args": { "External id": 23747,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11098 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040765.332, "dur": 0.425, "args": { "External id": 23748,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11099 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040766.381, "dur": 2.600, "args": { "External id": 23749,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11100 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040766.810, "dur": 2.104, "args": { "External id": 23750,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11101 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040770.861, "dur": 0.953, "args": { "External id": 23751,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11102 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040771.320, "dur": 0.423, "args": { "External id": 23752,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11103 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040772.173, "dur": 0.931, "args": { "External id": 23753,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11104 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040772.624, "dur": 0.415, "args": { "External id": 23754,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11105 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040773.541, "dur": 2.986, "args": { "External id": 23755,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11106 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040776.171, "dur": 0.293, "args": { "External id": 23756,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11107 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040776.793, "dur": 0.766, "args": { "External id": 23757,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11108 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040777.235, "dur": 0.263, "args": { "External id": 23758,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11109 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040777.803, "dur": 1.016, "args": { "External id": 23759,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11110 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040778.238, "dur": 0.513, "args": { "External id": 23760,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11111 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040779.130, "dur": 2.704, "args": { "External id": 23761,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11112 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040781.538, "dur": 0.220, "args": { "External id": 23762,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11113 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040782.253, "dur": 1.312, "args": { "External id": 23763,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11114 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040782.754, "dur": 0.740, "args": { "External id": 23764,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11115 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040783.806, "dur": 2.993, "args": { "External id": 23765,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11116 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040784.701, "dur": 2.031, "args": { "External id": 23766,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11117 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040788.942, "dur": 1.191, "args": { "External id": 23767,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11118 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040789.404, "dur": 0.664, "args": { "External id": 23768,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11119 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040790.373, "dur": 1.592, "args": { "External id": 23769,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11120 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040790.969, "dur": 0.932, "args": { "External id": 23770,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11121 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040792.296, "dur": 3.417, "args": { "External id": 23771,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11122 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040794.943, "dur": 0.706, "args": { "External id": 23772,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11123 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040795.979, "dur": 1.240, "args": { "External id": 23773,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11124 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040796.389, "dur": 0.761, "args": { "External id": 23774,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11125 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040797.462, "dur": 1.490, "args": { "External id": 23775,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11126 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040798.089, "dur": 0.800, "args": { "External id": 23776,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11127 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040799.426, "dur": 2.950, "args": { "External id": 23777,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11128 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040801.669, "dur": 0.637, "args": { "External id": 23778,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11129 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040802.617, "dur": 1.784, "args": { "External id": 23779,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11130 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040803.308, "dur": 1.023, "args": { "External id": 23780,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11131 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040804.961, "dur": 2.668, "args": { "External id": 23781,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11132 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040805.376, "dur": 2.186, "args": { "External id": 23782,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11133 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040810.138, "dur": 1.356, "args": { "External id": 23783,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11134 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040810.755, "dur": 0.673, "args": { "External id": 23784,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11135 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040811.732, "dur": 1.268, "args": { "External id": 23785,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11136 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040812.173, "dur": 0.761, "args": { "External id": 23786,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11137 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040813.267, "dur": 3.230, "args": { "External id": 23787,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11138 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040815.843, "dur": 0.586, "args": { "External id": 23788,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11139 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040816.760, "dur": 1.454, "args": { "External id": 23789,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11140 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040817.408, "dur": 0.736, "args": { "External id": 23790,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11141 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040818.539, "dur": 1.791, "args": { "External id": 23791,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11142 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040819.199, "dur": 1.064, "args": { "External id": 23792,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11143 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040820.721, "dur": 3.971, "args": { "External id": 23793,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11144 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040823.774, "dur": 0.852, "args": { "External id": 23794,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11145 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040824.965, "dur": 1.494, "args": { "External id": 23795,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11146 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040825.616, "dur": 0.775, "args": { "External id": 23796,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11147 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040826.681, "dur": 3.254, "args": { "External id": 23797,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11148 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040827.695, "dur": 2.172, "args": { "External id": 23798,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11149 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040832.091, "dur": 1.225, "args": { "External id": 23799,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11150 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040832.720, "dur": 0.532, "args": { "External id": 23800,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11151 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040833.803, "dur": 2.221, "args": { "External id": 23801,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11152 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040834.880, "dur": 1.080, "args": { "External id": 23802,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11153 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040836.269, "dur": 3.447, "args": { "External id": 23803,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11154 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040838.802, "dur": 0.845, "args": { "External id": 23804,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11155 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040839.987, "dur": 2.153, "args": { "External id": 23805,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11156 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040841.146, "dur": 0.926, "args": { "External id": 23806,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11157 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040842.392, "dur": 1.175, "args": { "External id": 23807,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11158 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040842.817, "dur": 0.684, "args": { "External id": 23808,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11159 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040843.794, "dur": 4.148, "args": { "External id": 23809,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11160 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040846.927, "dur": 0.950, "args": { "External id": 23810,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11161 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040848.184, "dur": 1.229, "args": { "External id": 23811,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11162 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040848.726, "dur": 0.613, "args": { "External id": 23812,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11163 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040849.642, "dur": 3.418, "args": { "External id": 23813,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11164 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040850.765, "dur": 2.223, "args": { "External id": 23814,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11165 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040855.443, "dur": 1.722, "args": { "External id": 23815,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11166 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040856.097, "dur": 1.002, "args": { "External id": 23816,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11167 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040857.392, "dur": 1.895, "args": { "External id": 23817,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11168 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040858.263, "dur": 0.955, "args": { "External id": 23818,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11169 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040859.535, "dur": 3.361, "args": { "External id": 23819,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11170 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040862.218, "dur": 0.609, "args": { "External id": 23820,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11171 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040863.142, "dur": 1.950, "args": { "External id": 23821,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11172 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040864.152, "dur": 0.873, "args": { "External id": 23822,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11173 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040865.333, "dur": 1.659, "args": { "External id": 23823,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11174 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040865.962, "dur": 0.964, "args": { "External id": 23824,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11175 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040867.418, "dur": 4.081, "args": { "External id": 23825,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11176 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040870.394, "dur": 1.035, "args": { "External id": 23826,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11177 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040871.766, "dur": 1.107, "args": { "External id": 23827,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11178 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040872.224, "dur": 0.577, "args": { "External id": 23828,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11179 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040873.120, "dur": 3.261, "args": { "External id": 23829,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11180 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040874.252, "dur": 2.057, "args": { "External id": 23830,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11181 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040878.196, "dur": 1.111, "args": { "External id": 23831,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11182 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040878.768, "dur": 0.476, "args": { "External id": 23832,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11183 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040879.531, "dur": 1.609, "args": { "External id": 23833,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11184 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040880.294, "dur": 0.781, "args": { "External id": 23834,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11185 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040881.584, "dur": 3.399, "args": { "External id": 23835,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11186 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040884.221, "dur": 0.696, "args": { "External id": 23836,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11187 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040885.228, "dur": 1.703, "args": { "External id": 23837,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11188 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040886.284, "dur": 0.578, "args": { "External id": 23838,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11189 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040887.205, "dur": 1.301, "args": { "External id": 23839,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11190 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040887.752, "dur": 0.678, "args": { "External id": 23840,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11191 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040888.730, "dur": 3.593, "args": { "External id": 23841,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11192 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040891.572, "dur": 0.682, "args": { "External id": 23842,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11193 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040892.563, "dur": 1.804, "args": { "External id": 23843,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11194 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040893.171, "dur": 1.128, "args": { "External id": 23844,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11195 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040894.600, "dur": 3.483, "args": { "External id": 23845,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11196 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040895.576, "dur": 2.437, "args": { "External id": 23846,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11197 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040900.009, "dur": 1.529, "args": { "External id": 23847,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11198 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040900.658, "dur": 0.815, "args": { "External id": 23848,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11199 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040901.943, "dur": 1.783, "args": { "External id": 23849,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11200 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040902.909, "dur": 0.751, "args": { "External id": 23850,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11201 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040903.998, "dur": 3.339, "args": { "External id": 23851,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11202 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040906.316, "dur": 0.955, "args": { "External id": 23852,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11203 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040907.581, "dur": 1.839, "args": { "External id": 23853,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11204 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040908.500, "dur": 0.851, "args": { "External id": 23854,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11205 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040909.869, "dur": 1.398, "args": { "External id": 23855,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11206 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040910.467, "dur": 0.736, "args": { "External id": 23856,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11207 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040911.492, "dur": 4.276, "args": { "External id": 23857,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11208 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040914.828, "dur": 0.863, "args": { "External id": 23858,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11209 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040916.016, "dur": 1.322, "args": { "External id": 23859,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11210 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040916.624, "dur": 0.645, "args": { "External id": 23860,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11211 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040917.562, "dur": 3.670, "args": { "External id": 23861,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11212 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040918.783, "dur": 2.380, "args": { "External id": 23862,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11213 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040923.356, "dur": 1.512, "args": { "External id": 23863,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11214 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040923.978, "dur": 0.826, "args": { "External id": 23864,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11215 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040925.093, "dur": 2.371, "args": { "External id": 23865,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11216 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040926.253, "dur": 1.145, "args": { "External id": 23866,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11217 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040927.718, "dur": 3.791, "args": { "External id": 23867,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11218 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040930.586, "dur": 0.854, "args": { "External id": 23868,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11219 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040931.753, "dur": 1.549, "args": { "External id": 23869,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11220 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040932.598, "dur": 0.636, "args": { "External id": 23870,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11221 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040933.544, "dur": 1.931, "args": { "External id": 23871,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11222 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040934.402, "dur": 0.999, "args": { "External id": 23872,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11223 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040935.700, "dur": 3.962, "args": { "External id": 23873,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11224 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040938.736, "dur": 0.863, "args": { "External id": 23874,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11225 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040939.910, "dur": 1.377, "args": { "External id": 23875,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11226 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040940.528, "dur": 0.693, "args": { "External id": 23876,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11227 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040941.538, "dur": 3.173, "args": { "External id": 23877,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11228 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040942.370, "dur": 2.088, "args": { "External id": 23878,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11229 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040946.712, "dur": 1.335, "args": { "External id": 23879,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11230 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040947.315, "dur": 0.668, "args": { "External id": 23880,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11231 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040948.464, "dur": 1.748, "args": { "External id": 23881,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11232 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040949.236, "dur": 0.911, "args": { "External id": 23882,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11233 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040950.502, "dur": 3.384, "args": { "External id": 23883,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11234 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040953.213, "dur": 0.605, "args": { "External id": 23884,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11235 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040954.138, "dur": 2.328, "args": { "External id": 23885,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11236 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040955.424, "dur": 0.976, "args": { "External id": 23886,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11237 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040956.910, "dur": 1.363, "args": { "External id": 23887,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11238 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040957.333, "dur": 0.874, "args": { "External id": 23888,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11239 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040958.502, "dur": 3.941, "args": { "External id": 23889,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11240 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040961.613, "dur": 0.765, "args": { "External id": 23890,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11241 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040962.799, "dur": 1.187, "args": { "External id": 23891,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11242 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040963.415, "dur": 0.503, "args": { "External id": 23892,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11243 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040964.338, "dur": 3.040, "args": { "External id": 23893,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11244 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040965.150, "dur": 2.155, "args": { "External id": 23894,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11245 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040969.385, "dur": 1.234, "args": { "External id": 23895,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11246 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040970.020, "dur": 0.533, "args": { "External id": 23896,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11247 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040970.843, "dur": 1.560, "args": { "External id": 23897,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11248 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040971.645, "dur": 0.684, "args": { "External id": 23898,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11249 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040972.659, "dur": 3.478, "args": { "External id": 23899,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11250 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040975.326, "dur": 0.743, "args": { "External id": 23900,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11251 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040976.413, "dur": 1.404, "args": { "External id": 23901,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11252 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040977.258, "dur": 0.492, "args": { "External id": 23902,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11253 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040978.056, "dur": 1.343, "args": { "External id": 23903,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11254 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652040978.473, "dur": 0.865, "args": { "External id": 23904,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11255 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652040979.625, "dur": 30.030, "args": { "External id": 23905,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11256 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041008.154, "dur": 0.989, "args": { "External id": 23906,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11257 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041010.624, "dur": 1.486, "args": { "External id": 23907,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11258 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041011.432, "dur": 0.605, "args": { "External id": 23908,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11259 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041012.370, "dur": 3.229, "args": { "External id": 23909,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11260 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041013.353, "dur": 2.170, "args": { "External id": 23910,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11261 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041017.416, "dur": 1.282, "args": { "External id": 23911,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11262 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041017.883, "dur": 0.753, "args": { "External id": 23912,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11263 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041018.943, "dur": 2.135, "args": { "External id": 23913,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11264 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041019.945, "dur": 1.059, "args": { "External id": 23914,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11265 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041021.569, "dur": 3.294, "args": { "External id": 23915,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11266 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041024.052, "dur": 0.735, "args": { "External id": 23916,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11267 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041025.133, "dur": 2.363, "args": { "External id": 23917,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11268 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041026.355, "dur": 1.071, "args": { "External id": 23918,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11269 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041027.827, "dur": 1.549, "args": { "External id": 23919,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11270 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041028.493, "dur": 0.810, "args": { "External id": 23920,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11271 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041029.812, "dur": 3.544, "args": { "External id": 23921,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11272 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041032.626, "dur": 0.665, "args": { "External id": 23922,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11273 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041033.839, "dur": 1.118, "args": { "External id": 23923,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11274 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041034.270, "dur": 0.614, "args": { "External id": 23924,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11275 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041035.209, "dur": 3.702, "args": { "External id": 23925,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11276 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041036.502, "dur": 2.332, "args": { "External id": 23926,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11277 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041040.966, "dur": 1.424, "args": { "External id": 23927,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11278 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041041.662, "dur": 0.656, "args": { "External id": 23928,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11279 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041042.668, "dur": 1.811, "args": { "External id": 23929,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11280 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041043.672, "dur": 0.736, "args": { "External id": 23930,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11281 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041044.738, "dur": 3.997, "args": { "External id": 23931,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11282 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041047.776, "dur": 0.899, "args": { "External id": 23932,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11283 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041049.026, "dur": 1.940, "args": { "External id": 23933,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11284 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041050.227, "dur": 0.678, "args": { "External id": 23934,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11285 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041051.228, "dur": 1.472, "args": { "External id": 23935,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11286 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041051.878, "dur": 0.754, "args": { "External id": 23936,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11287 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041052.986, "dur": 4.353, "args": { "External id": 23937,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11288 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041056.350, "dur": 0.924, "args": { "External id": 23938,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11289 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::unsqueeze", "pid": 1336754, "tid": 1336754, "ts": 1295652041058.014, "dur": 2.913, "args": { "External id": 23939,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11290 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041060.252, "dur": 0.608, "args": { "External id": 23940,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[1]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11291 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::cat", "pid": 1336754, "tid": 1336754, "ts": 1295652041080.040, "dur": 128.075, "args": { "External id": 23941,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11292 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336754, "tid": 1336754, "ts": 1295652041326.784, "dur": 138.481, "args": { "External id": 23942,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11293 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::linalg_vector_norm", "pid": 1336754, "tid": 1336754, "ts": 1295652041389.344, "dur": 54.685, "args": { "External id": 23943,"Record function id": 0, "Concrete Inputs": ["", "2.", "", "False", ""], "Input type": ["float", "Scalar", "", "Scalar", ""], "Input Strides": [[1], [], [], [], []], "Input Dims": [[291], [], [], [], []], "Ev Idx": 11294 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::as_strided", "pid": 1336754, "tid": 1336754, "ts": 1295652041404.289, "dur": 1.119, "args": { "External id": 23944,"Record function id": 0, "Concrete Inputs": ["", "[1]", "[0]", ""], "Input type": ["float", "ScalarList", "ScalarList", ""], "Input Strides": [[], [], [], []], "Input Dims": [[], [], [], []], "Ev Idx": 11295 } }, { "ph": "X", "cat": "cpu_op", "name": "Redistribute", "pid": 1336754, "tid": 1336754, "ts": 1295652041891.688, "dur": 990.670, "args": { "External id": 23945,"Sequence number": 246776, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", "False"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11296 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336754, "tid": 1336754, "ts": 1295652041945.771, "dur": 140.589, "args": { "External id": 23946,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11297 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652041949.884, "dur": 1.638, "args": { "External id": 23947,"Record function id": 0, "Concrete Inputs": ["", "2."], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11298 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652042034.932, "dur": 1.471, "args": { "External id": 23948,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11299 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::all_reduce", "pid": 1336754, "tid": 1336754, "ts": 1295652042114.358, "dur": 449.890, "args": { "External id": 23949,"Record function id": 0, "Concrete Inputs": ["", "", ""], "Input type": ["float", "", ""], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11300 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clone", "pid": 1336754, "tid": 1336754, "ts": 1295652042118.280, "dur": 49.018, "args": { "External id": 23950,"Record function id": 0, "Concrete Inputs": ["", "0"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11301 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty_like", "pid": 1336754, "tid": 1336754, "ts": 1295652042121.759, "dur": 11.219, "args": { "External id": 23951,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "0"], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11302 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295652042127.702, "dur": 4.508, "args": { "External id": 23952,"Record function id": 0, "Concrete Inputs": ["[]", "6", "0", "", "", "0"], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", "Scalar"], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11303 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::copy_", "pid": 1336754, "tid": 1336754, "ts": 1295652042134.469, "dur": 32.284, "args": { "External id": 23953,"Record function id": 0, "Concrete Inputs": ["", "", "False"], "Input type": ["float", "float", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11304 } }, { "ph": "X", "cat": "cpu_op", "name": "c10d::allreduce_", "pid": 1336754, "tid": 1336754, "ts": 1295652042177.452, "dur": 383.611, "args": { "External id": 23954,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "-1"], "Input type": ["TensorList", "", "", "", "Scalar"], "Input Strides": [[[]], [], [], [], []], "Input Dims": [[[]], [], [], [], []], "Ev Idx": 11305 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295652042209.353, "dur": 344.806, "args": { "External id": 23955,"Record function id": 0, "Collective name": "allreduce", "Process Group Description": "default_pg", "dtype": "Float", "Rank": 1, "Input Strides": [[[]], [], [], [], [], [], [], [], [], []], "Concrete Inputs": ["", "", "", "1", "", "[]", "[]", "0", "1", "8"], "Out msg nelems": 1, "Process Group Name": "0", "Input type": ["TensorList", "", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Global rank stride": 1, "Out split size": "[]", "In split size": "[]", "Process Group Ranks": "[0, 1, 2, 3, 4, 5, 6, 7]", "Group size": 8, "Input Dims": [[[]], [], [], [], [], [], [], [], [], []], "Global rank start": 0, "Ev Idx": 11306, "In msg nelems": 1 } }, { "ph": "X", "cat": "user_annotation", "name": "nccl:all_reduce", "pid": 1336754, "tid": 1336754, "ts": 1295652042227.910, "dur": 320.340, "args": { "External id": 23956,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11307 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336754, "tid": 1336754, "ts": 1295652042632.661, "dur": 208.926, "args": { "External id": 23957,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11308 } }, { "ph": "X", "cat": "cpu_op", "name": "_c10d_functional::wait_tensor", "pid": 1336754, "tid": 1336754, "ts": 1295652042726.537, "dur": 33.319, "args": { "External id": 23958,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11309 } }, { "ph": "X", "cat": "cpu_op", "name": "record_param_comms", "pid": 1336754, "tid": 1336754, "ts": 1295652042747.176, "dur": 4.526, "args": { "External id": 23959,"Record function id": 0, "Collective name": "wait", "Process Group Description": "default_pg", "dtype": "Byte", "Input Dims": [[], [], [], [], [], [], [], [], []], "Input Strides": [[], [], [], [], [], [], [], [], []], "Input type": ["", "", "Scalar", "", "ScalarList", "ScalarList", "Scalar", "Scalar", "Scalar"], "Concrete Inputs": ["", "", "1", "", "[]", "[]", "-1", "-1", "1"], "Out msg nelems": 0, "Process Group Name": "0", "Process Group Ranks": "[]", "Group size": 1, "Ev Idx": 11310, "In msg nelems": 0, "Rank": 1, "In split size": "[]", "Out split size": "[]" } }, { "ph": "X", "cat": "cpu_op", "name": "aten::pow", "pid": 1336754, "tid": 1336754, "ts": 1295652042789.084, "dur": 46.535, "args": { "External id": 23960,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11311 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652042792.090, "dur": 0.934, "args": { "External id": 23961,"Record function id": 0, "Concrete Inputs": ["", "0.5"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11312 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652042794.746, "dur": 0.500, "args": { "External id": 23962,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11313 } }, { "ph": "X", "cat": "cpu_op", "name": "_ToTorchTensor", "pid": 1336754, "tid": 1336754, "ts": 1295652042898.050, "dur": 22.860, "args": { "External id": 23963,"Sequence number": 246777, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", ""], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11314 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view_as", "pid": 1336754, "tid": 1336754, "ts": 1295652042909.340, "dur": 8.462, "args": { "External id": 23964,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11315 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::view", "pid": 1336754, "tid": 1336754, "ts": 1295652042911.901, "dur": 5.750, "args": { "External id": 23965,"Record function id": 0, "Concrete Inputs": ["", "[]"], "Input type": ["float", "ScalarList"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11316 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::add", "pid": 1336754, "tid": 1336754, "ts": 1295652043368.777, "dur": 42.664, "args": { "External id": 23966,"Record function id": 0, "Concrete Inputs": ["", "", "1"], "Input type": ["float", "double", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11317 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::reciprocal", "pid": 1336754, "tid": 1336754, "ts": 1295652043420.868, "dur": 24.616, "args": { "External id": 23967,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11318 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::mul", "pid": 1336754, "tid": 1336754, "ts": 1295652043452.744, "dur": 25.518, "args": { "External id": 23968,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "double"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11319 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::clamp", "pid": 1336754, "tid": 1336754, "ts": 1295652043495.472, "dur": 31.962, "args": { "External id": 23969,"Record function id": 0, "Concrete Inputs": ["", "", "1."], "Input type": ["float", "", "Scalar"], "Input Strides": [[], [], []], "Input Dims": [[], [], []], "Ev Idx": 11320 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652043499.449, "dur": 0.704, "args": { "External id": 23970,"Record function id": 0, "Concrete Inputs": ["", "6", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], []], "Input Dims": [[], [], [], [], []], "Ev Idx": 11321 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::to", "pid": 1336754, "tid": 1336754, "ts": 1295652043548.640, "dur": 0.387, "args": { "External id": 23971,"Record function id": 0, "Concrete Inputs": ["", "6", "0", "", "", "False", "False", ""], "Input type": ["float", "Scalar", "Scalar", "", "", "Scalar", "Scalar", ""], "Input Strides": [[], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], []], "Ev Idx": 11322 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336754, "tid": 1336754, "ts": 1295652043667.948, "dur": 856.787, "args": { "External id": 23972,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11323 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_mul_", "pid": 1336754, "tid": 1336754, "ts": 1295652044204.556, "dur": 288.127, "args": { "External id": 23973,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["TensorList", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11324 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isnan", "pid": 1336754, "tid": 1336754, "ts": 1295652044572.033, "dur": 29.461, "args": { "External id": 23974,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11325 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::ne", "pid": 1336754, "tid": 1336754, "ts": 1295652044575.463, "dur": 25.383, "args": { "External id": 23975,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11326 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1336754, "ts": 1295652044605.097, "dur": 198.366, "args": { "External id": 23976,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11327 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295652044606.686, "dur": 196.565, "args": { "External id": 23977,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11328 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295652044608.737, "dur": 194.156, "args": { "External id": 23978,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11329 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::isinf", "pid": 1336754, "tid": 1336754, "ts": 1295652044808.781, "dur": 59.892, "args": { "External id": 23979,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11330 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295652044811.390, "dur": 34.388, "args": { "External id": 23980,"Record function id": 0, "Concrete Inputs": [""], "Input type": ["float"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11331 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::empty", "pid": 1336754, "tid": 1336754, "ts": 1295652044818.968, "dur": 2.992, "args": { "External id": 23981,"Record function id": 0, "Concrete Inputs": ["[0]", "6", "0", "", "", ""], "Input type": ["ScalarList", "Scalar", "Scalar", "", "", ""], "Input Strides": [[], [], [], [], [], []], "Input Dims": [[], [], [], [], [], []], "Ev Idx": 11332 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::abs", "pid": 1336754, "tid": 1336754, "ts": 1295652044823.688, "dur": 21.726, "args": { "External id": 23982,"Record function id": 0, "Concrete Inputs": ["", ""], "Input type": ["float", "float"], "Input Strides": [[], [1]], "Input Dims": [[], [0]], "Ev Idx": 11333 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::resize_", "pid": 1336754, "tid": 1336754, "ts": 1295652044828.286, "dur": 2.601, "args": { "External id": 23983,"Record function id": 0, "Concrete Inputs": ["", "[]", ""], "Input type": ["float", "ScalarList", ""], "Input Strides": [[1], [], []], "Input Dims": [[0], [], []], "Ev Idx": 11334 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::eq", "pid": 1336754, "tid": 1336754, "ts": 1295652044847.501, "dur": 20.398, "args": { "External id": 23984,"Record function id": 0, "Concrete Inputs": ["", "inf"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11335 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::is_nonzero", "pid": 1336754, "tid": 1336754, "ts": 1295652044870.738, "dur": 36.655, "args": { "External id": 23985,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11336 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::item", "pid": 1336754, "tid": 1336754, "ts": 1295652044873.855, "dur": 33.396, "args": { "External id": 23986,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11337 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_local_scalar_dense", "pid": 1336754, "tid": 1336754, "ts": 1295652044874.855, "dur": 32.147, "args": { "External id": 23987,"Sequence number": 246778, "Fwd thread id": 0, "Record function id": 0, "Concrete Inputs": [""], "Input type": ["bool"], "Input Strides": [[]], "Input Dims": [[]], "Ev Idx": 11338 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#OptimizersContainer.step", "pid": 1336754, "tid": 1336754, "ts": 1295652044939.019, "dur": 6127.884, "args": { "External id": 23988,"Record function id": 0, "Ev Idx": 11339 } }, { "ph": "X", "cat": "user_annotation", "name": "Optimizer.step#AdamW.step", "pid": 1336754, "tid": 1336754, "ts": 1295652044970.914, "dur": 6070.089, "args": { "External id": 23989,"Record function id": 0, "Ev Idx": 11340 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_foreach_add_", "pid": 1336754, "tid": 1336754, "ts": 1295652046396.813, "dur": 296.502, "args": { "External id": 23990,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["TensorList", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11341 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046417.005, "dur": 1.055, "args": { "External id": 23991,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11342 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046419.305, "dur": 0.274, "args": { "External id": 23992,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11343 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046420.064, "dur": 0.330, "args": { "External id": 23993,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11344 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046420.839, "dur": 0.074, "args": { "External id": 23994,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11345 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046421.461, "dur": 0.088, "args": { "External id": 23995,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11346 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046421.872, "dur": 0.104, "args": { "External id": 23996,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11347 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046422.464, "dur": 0.096, "args": { "External id": 23997,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11348 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046422.937, "dur": 0.283, "args": { "External id": 23998,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11349 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046423.602, "dur": 0.069, "args": { "External id": 23999,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11350 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046423.938, "dur": 0.070, "args": { "External id": 24000,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11351 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046424.592, "dur": 0.243, "args": { "External id": 24001,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11352 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046425.332, "dur": 0.064, "args": { "External id": 24002,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11353 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046425.736, "dur": 0.066, "args": { "External id": 24003,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11354 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046426.272, "dur": 0.052, "args": { "External id": 24004,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11355 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046426.618, "dur": 0.071, "args": { "External id": 24005,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11356 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046427.152, "dur": 0.066, "args": { "External id": 24006,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11357 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046427.804, "dur": 0.064, "args": { "External id": 24007,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11358 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046428.210, "dur": 0.062, "args": { "External id": 24008,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11359 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046428.745, "dur": 0.062, "args": { "External id": 24009,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11360 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046429.130, "dur": 0.067, "args": { "External id": 24010,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11361 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046429.672, "dur": 0.070, "args": { "External id": 24011,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11362 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046430.177, "dur": 0.069, "args": { "External id": 24012,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11363 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046430.611, "dur": 0.062, "args": { "External id": 24013,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11364 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046431.219, "dur": 0.068, "args": { "External id": 24014,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11365 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046431.639, "dur": 0.065, "args": { "External id": 24015,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11366 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046432.053, "dur": 0.063, "args": { "External id": 24016,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11367 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046432.534, "dur": 0.060, "args": { "External id": 24017,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11368 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046433.005, "dur": 0.066, "args": { "External id": 24018,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11369 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046433.580, "dur": 0.067, "args": { "External id": 24019,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11370 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046434.220, "dur": 0.053, "args": { "External id": 24020,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11371 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046434.594, "dur": 0.096, "args": { "External id": 24021,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11372 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046435.170, "dur": 0.283, "args": { "External id": 24022,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11373 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046435.796, "dur": 0.062, "args": { "External id": 24023,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11374 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046436.303, "dur": 0.063, "args": { "External id": 24024,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11375 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046436.870, "dur": 0.065, "args": { "External id": 24025,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11376 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046437.310, "dur": 0.060, "args": { "External id": 24026,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11377 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046437.919, "dur": 0.067, "args": { "External id": 24027,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11378 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046438.390, "dur": 0.063, "args": { "External id": 24028,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11379 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046438.803, "dur": 0.300, "args": { "External id": 24029,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11380 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046439.475, "dur": 0.277, "args": { "External id": 24030,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11381 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046440.221, "dur": 0.062, "args": { "External id": 24031,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11382 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046440.844, "dur": 0.068, "args": { "External id": 24032,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11383 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046441.422, "dur": 0.066, "args": { "External id": 24033,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11384 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046441.859, "dur": 0.063, "args": { "External id": 24034,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11385 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046442.308, "dur": 0.093, "args": { "External id": 24035,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11386 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046442.737, "dur": 0.066, "args": { "External id": 24036,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11387 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046443.097, "dur": 0.065, "args": { "External id": 24037,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11388 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046443.859, "dur": 0.068, "args": { "External id": 24038,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11389 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046444.282, "dur": 0.061, "args": { "External id": 24039,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11390 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046444.883, "dur": 0.066, "args": { "External id": 24040,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11391 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046445.406, "dur": 0.069, "args": { "External id": 24041,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11392 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046446.149, "dur": 0.065, "args": { "External id": 24042,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11393 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046446.547, "dur": 0.073, "args": { "External id": 24043,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11394 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046447.160, "dur": 0.063, "args": { "External id": 24044,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11395 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046447.491, "dur": 0.049, "args": { "External id": 24045,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11396 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046448.300, "dur": 0.065, "args": { "External id": 24046,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11397 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046448.648, "dur": 0.050, "args": { "External id": 24047,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11398 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046449.616, "dur": 0.053, "args": { "External id": 24048,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11399 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046450.123, "dur": 0.066, "args": { "External id": 24049,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11400 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046450.955, "dur": 0.067, "args": { "External id": 24050,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11401 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046451.319, "dur": 0.052, "args": { "External id": 24051,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11402 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046451.986, "dur": 0.066, "args": { "External id": 24052,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11403 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046452.314, "dur": 0.054, "args": { "External id": 24053,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11404 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046453.283, "dur": 0.067, "args": { "External id": 24054,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11405 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046453.608, "dur": 0.051, "args": { "External id": 24055,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11406 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046454.216, "dur": 0.066, "args": { "External id": 24056,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11407 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046454.541, "dur": 0.051, "args": { "External id": 24057,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11408 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046455.326, "dur": 0.066, "args": { "External id": 24058,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11409 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046455.859, "dur": 0.070, "args": { "External id": 24059,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11410 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046456.447, "dur": 0.062, "args": { "External id": 24060,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11411 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046456.773, "dur": 0.053, "args": { "External id": 24061,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11412 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046457.593, "dur": 0.065, "args": { "External id": 24062,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11413 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046457.916, "dur": 0.048, "args": { "External id": 24063,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11414 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046458.770, "dur": 0.065, "args": { "External id": 24064,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11415 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046483.531, "dur": 0.137, "args": { "External id": 24065,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11416 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046484.317, "dur": 0.050, "args": { "External id": 24066,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11417 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046484.690, "dur": 0.053, "args": { "External id": 24067,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11418 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046485.527, "dur": 0.063, "args": { "External id": 24068,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11419 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046485.858, "dur": 0.051, "args": { "External id": 24069,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11420 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046486.707, "dur": 0.066, "args": { "External id": 24070,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11421 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046487.026, "dur": 0.052, "args": { "External id": 24071,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11422 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046487.772, "dur": 0.063, "args": { "External id": 24072,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11423 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046488.084, "dur": 0.050, "args": { "External id": 24073,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11424 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046488.740, "dur": 0.067, "args": { "External id": 24074,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11425 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046489.257, "dur": 0.068, "args": { "External id": 24075,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11426 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046489.881, "dur": 0.070, "args": { "External id": 24076,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11427 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046490.201, "dur": 0.050, "args": { "External id": 24077,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11428 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046491.016, "dur": 0.064, "args": { "External id": 24078,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11429 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046491.328, "dur": 0.055, "args": { "External id": 24079,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11430 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046492.124, "dur": 0.068, "args": { "External id": 24080,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11431 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046492.450, "dur": 0.062, "args": { "External id": 24081,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11432 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046493.020, "dur": 0.064, "args": { "External id": 24082,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11433 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046493.477, "dur": 0.063, "args": { "External id": 24083,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11434 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046494.137, "dur": 0.053, "args": { "External id": 24084,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11435 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046494.452, "dur": 0.050, "args": { "External id": 24085,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11436 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046495.041, "dur": 0.065, "args": { "External id": 24086,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11437 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046495.367, "dur": 0.054, "args": { "External id": 24087,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11438 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046495.927, "dur": 0.065, "args": { "External id": 24088,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11439 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046496.257, "dur": 0.050, "args": { "External id": 24089,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11440 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046496.843, "dur": 0.067, "args": { "External id": 24090,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11441 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046497.264, "dur": 0.070, "args": { "External id": 24091,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11442 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046497.877, "dur": 0.066, "args": { "External id": 24092,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11443 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046498.202, "dur": 0.051, "args": { "External id": 24093,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11444 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046498.772, "dur": 0.064, "args": { "External id": 24094,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11445 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046499.099, "dur": 0.053, "args": { "External id": 24095,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11446 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046499.687, "dur": 0.066, "args": { "External id": 24096,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11447 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046500.020, "dur": 0.053, "args": { "External id": 24097,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11448 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046500.817, "dur": 0.064, "args": { "External id": 24098,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11449 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046501.146, "dur": 0.053, "args": { "External id": 24099,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11450 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046501.947, "dur": 0.066, "args": { "External id": 24100,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11451 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046502.277, "dur": 0.052, "args": { "External id": 24101,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11452 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046503.208, "dur": 0.063, "args": { "External id": 24102,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11453 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046503.533, "dur": 0.079, "args": { "External id": 24103,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11454 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046504.365, "dur": 0.066, "args": { "External id": 24104,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11455 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046504.696, "dur": 0.051, "args": { "External id": 24105,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11456 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046505.525, "dur": 0.067, "args": { "External id": 24106,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11457 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046505.853, "dur": 0.056, "args": { "External id": 24107,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11458 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046506.423, "dur": 0.067, "args": { "External id": 24108,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11459 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046506.781, "dur": 0.054, "args": { "External id": 24109,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11460 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046507.584, "dur": 0.067, "args": { "External id": 24110,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11461 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046507.918, "dur": 0.055, "args": { "External id": 24111,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11462 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046508.478, "dur": 0.068, "args": { "External id": 24112,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11463 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046508.999, "dur": 0.069, "args": { "External id": 24113,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11464 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046509.695, "dur": 0.071, "args": { "External id": 24114,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11465 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046510.029, "dur": 0.050, "args": { "External id": 24115,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11466 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046510.588, "dur": 0.064, "args": { "External id": 24116,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11467 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046510.915, "dur": 0.051, "args": { "External id": 24117,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11468 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046516.203, "dur": 0.073, "args": { "External id": 24118,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11469 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046516.592, "dur": 0.054, "args": { "External id": 24119,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11470 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046518.381, "dur": 0.063, "args": { "External id": 24120,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11471 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046518.707, "dur": 0.052, "args": { "External id": 24121,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11472 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046519.516, "dur": 0.067, "args": { "External id": 24122,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11473 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046519.830, "dur": 0.049, "args": { "External id": 24123,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11474 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046520.445, "dur": 0.068, "args": { "External id": 24124,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11475 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046520.763, "dur": 0.053, "args": { "External id": 24125,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11476 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046521.399, "dur": 0.067, "args": { "External id": 24126,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11477 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046521.714, "dur": 0.051, "args": { "External id": 24127,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11478 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046522.251, "dur": 0.064, "args": { "External id": 24128,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11479 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046522.582, "dur": 0.058, "args": { "External id": 24129,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11480 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046523.383, "dur": 0.065, "args": { "External id": 24130,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11481 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046523.695, "dur": 0.057, "args": { "External id": 24131,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11482 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046524.252, "dur": 0.067, "args": { "External id": 24132,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11483 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046524.579, "dur": 0.055, "args": { "External id": 24133,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11484 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046525.112, "dur": 0.067, "args": { "External id": 24134,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11485 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046525.437, "dur": 0.048, "args": { "External id": 24135,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11486 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046526.208, "dur": 0.068, "args": { "External id": 24136,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11487 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046526.545, "dur": 0.056, "args": { "External id": 24137,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11488 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046527.105, "dur": 0.067, "args": { "External id": 24138,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11489 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046527.432, "dur": 0.054, "args": { "External id": 24139,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11490 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046528.018, "dur": 0.067, "args": { "External id": 24140,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11491 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046528.378, "dur": 0.052, "args": { "External id": 24141,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11492 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046528.981, "dur": 0.064, "args": { "External id": 24142,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11493 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046529.306, "dur": 0.055, "args": { "External id": 24143,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11494 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046529.910, "dur": 0.068, "args": { "External id": 24144,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11495 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046530.238, "dur": 0.063, "args": { "External id": 24145,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11496 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046530.947, "dur": 0.065, "args": { "External id": 24146,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11497 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046531.273, "dur": 0.054, "args": { "External id": 24147,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11498 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046531.994, "dur": 0.063, "args": { "External id": 24148,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11499 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046532.318, "dur": 0.054, "args": { "External id": 24149,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11500 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046533.470, "dur": 0.068, "args": { "External id": 24150,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11501 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046533.795, "dur": 0.050, "args": { "External id": 24151,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11502 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046534.385, "dur": 0.066, "args": { "External id": 24152,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11503 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046534.709, "dur": 0.056, "args": { "External id": 24153,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11504 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046535.330, "dur": 0.071, "args": { "External id": 24154,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11505 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046535.657, "dur": 0.050, "args": { "External id": 24155,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11506 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046536.271, "dur": 0.067, "args": { "External id": 24156,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11507 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046536.591, "dur": 0.057, "args": { "External id": 24157,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11508 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046537.181, "dur": 0.068, "args": { "External id": 24158,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11509 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046537.537, "dur": 0.052, "args": { "External id": 24159,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11510 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046538.138, "dur": 0.067, "args": { "External id": 24160,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11511 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046538.475, "dur": 0.055, "args": { "External id": 24161,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11512 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046539.018, "dur": 0.065, "args": { "External id": 24162,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11513 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046539.344, "dur": 0.050, "args": { "External id": 24163,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11514 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046539.941, "dur": 0.068, "args": { "External id": 24164,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11515 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046540.366, "dur": 0.066, "args": { "External id": 24165,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11516 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046541.261, "dur": 0.066, "args": { "External id": 24166,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11517 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046541.591, "dur": 0.051, "args": { "External id": 24167,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11518 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046542.176, "dur": 0.067, "args": { "External id": 24168,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11519 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046542.501, "dur": 0.053, "args": { "External id": 24169,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11520 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046543.176, "dur": 0.068, "args": { "External id": 24170,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11521 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046543.505, "dur": 0.055, "args": { "External id": 24171,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11522 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046544.061, "dur": 0.066, "args": { "External id": 24172,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11523 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046544.383, "dur": 0.054, "args": { "External id": 24173,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11524 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046544.951, "dur": 0.066, "args": { "External id": 24174,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11525 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046545.367, "dur": 0.071, "args": { "External id": 24175,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11526 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046546.087, "dur": 0.061, "args": { "External id": 24176,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11527 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046546.407, "dur": 0.079, "args": { "External id": 24177,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11528 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046547.014, "dur": 0.065, "args": { "External id": 24178,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11529 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046547.344, "dur": 0.052, "args": { "External id": 24179,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11530 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046547.910, "dur": 0.064, "args": { "External id": 24180,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11531 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046548.237, "dur": 0.050, "args": { "External id": 24181,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11532 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046548.801, "dur": 0.065, "args": { "External id": 24182,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11533 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046549.137, "dur": 0.051, "args": { "External id": 24183,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11534 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046549.927, "dur": 0.063, "args": { "External id": 24184,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11535 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046550.251, "dur": 0.053, "args": { "External id": 24185,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11536 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046550.851, "dur": 0.063, "args": { "External id": 24186,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11537 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046551.181, "dur": 0.055, "args": { "External id": 24187,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11538 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046551.948, "dur": 0.067, "args": { "External id": 24188,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11539 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046552.272, "dur": 0.055, "args": { "External id": 24189,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11540 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046552.819, "dur": 0.066, "args": { "External id": 24190,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11541 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046553.187, "dur": 0.052, "args": { "External id": 24191,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11542 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046553.950, "dur": 0.061, "args": { "External id": 24192,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11543 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046554.274, "dur": 0.054, "args": { "External id": 24193,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11544 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046555.044, "dur": 0.069, "args": { "External id": 24194,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11545 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046555.373, "dur": 0.053, "args": { "External id": 24195,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11546 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046556.177, "dur": 0.070, "args": { "External id": 24196,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11547 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046556.503, "dur": 0.054, "args": { "External id": 24197,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11548 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046557.311, "dur": 0.063, "args": { "External id": 24198,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11549 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046557.638, "dur": 0.066, "args": { "External id": 24199,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11550 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046558.483, "dur": 0.067, "args": { "External id": 24200,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11551 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046558.813, "dur": 0.056, "args": { "External id": 24201,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11552 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046559.405, "dur": 0.071, "args": { "External id": 24202,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11553 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046559.737, "dur": 0.056, "args": { "External id": 24203,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11554 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046560.314, "dur": 0.069, "args": { "External id": 24204,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11555 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046560.643, "dur": 0.053, "args": { "External id": 24205,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11556 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046561.243, "dur": 0.067, "args": { "External id": 24206,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11557 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046561.570, "dur": 0.055, "args": { "External id": 24207,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11558 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046562.188, "dur": 0.068, "args": { "External id": 24208,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11559 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046562.516, "dur": 0.051, "args": { "External id": 24209,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11560 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046563.302, "dur": 0.065, "args": { "External id": 24210,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11561 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046563.623, "dur": 0.078, "args": { "External id": 24211,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11562 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046564.487, "dur": 0.063, "args": { "External id": 24212,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11563 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046564.809, "dur": 0.054, "args": { "External id": 24213,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11564 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046565.534, "dur": 0.069, "args": { "External id": 24214,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11565 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046565.859, "dur": 0.051, "args": { "External id": 24215,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11566 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046566.592, "dur": 0.068, "args": { "External id": 24216,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11567 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046567.141, "dur": 0.074, "args": { "External id": 24217,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11568 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046567.920, "dur": 0.073, "args": { "External id": 24218,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11569 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046568.292, "dur": 0.050, "args": { "External id": 24219,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11570 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046569.004, "dur": 0.067, "args": { "External id": 24220,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11571 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046569.334, "dur": 0.054, "args": { "External id": 24221,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11572 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046570.053, "dur": 0.065, "args": { "External id": 24222,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11573 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046570.392, "dur": 0.053, "args": { "External id": 24223,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11574 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046571.161, "dur": 0.067, "args": { "External id": 24224,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11575 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046571.489, "dur": 0.056, "args": { "External id": 24225,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11576 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046572.037, "dur": 0.068, "args": { "External id": 24226,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11577 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046572.363, "dur": 0.055, "args": { "External id": 24227,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11578 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046573.149, "dur": 0.067, "args": { "External id": 24228,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11579 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046573.462, "dur": 0.055, "args": { "External id": 24229,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11580 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046574.040, "dur": 0.064, "args": { "External id": 24230,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11581 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046574.348, "dur": 0.054, "args": { "External id": 24231,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11582 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046575.127, "dur": 0.062, "args": { "External id": 24232,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11583 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046575.433, "dur": 0.051, "args": { "External id": 24233,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11584 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046576.021, "dur": 0.064, "args": { "External id": 24234,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11585 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046576.351, "dur": 0.051, "args": { "External id": 24235,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11586 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046576.963, "dur": 0.072, "args": { "External id": 24236,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11587 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046577.322, "dur": 0.054, "args": { "External id": 24237,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11588 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046577.928, "dur": 0.066, "args": { "External id": 24238,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11589 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046578.259, "dur": 0.057, "args": { "External id": 24239,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11590 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046578.854, "dur": 0.068, "args": { "External id": 24240,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11591 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046579.182, "dur": 0.052, "args": { "External id": 24241,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11592 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046579.753, "dur": 0.073, "args": { "External id": 24242,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11593 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046580.082, "dur": 0.057, "args": { "External id": 24243,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11594 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046580.898, "dur": 0.063, "args": { "External id": 24244,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11595 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046581.221, "dur": 0.050, "args": { "External id": 24245,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11596 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046581.989, "dur": 0.064, "args": { "External id": 24246,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11597 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046582.313, "dur": 0.055, "args": { "External id": 24247,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11598 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046582.884, "dur": 0.065, "args": { "External id": 24248,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11599 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046583.209, "dur": 0.053, "args": { "External id": 24249,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11600 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046583.875, "dur": 0.065, "args": { "External id": 24250,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11601 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046584.201, "dur": 0.060, "args": { "External id": 24251,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11602 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046585.004, "dur": 0.070, "args": { "External id": 24252,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11603 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046585.334, "dur": 0.055, "args": { "External id": 24253,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11604 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046585.889, "dur": 0.069, "args": { "External id": 24254,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11605 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046586.210, "dur": 0.078, "args": { "External id": 24255,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11606 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046587.016, "dur": 0.066, "args": { "External id": 24256,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11607 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046587.341, "dur": 0.055, "args": { "External id": 24257,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11608 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046588.008, "dur": 0.070, "args": { "External id": 24258,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11609 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046588.334, "dur": 0.053, "args": { "External id": 24259,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11610 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046588.894, "dur": 0.068, "args": { "External id": 24260,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11611 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046589.222, "dur": 0.054, "args": { "External id": 24261,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11612 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046589.957, "dur": 0.065, "args": { "External id": 24262,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11613 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046590.322, "dur": 0.049, "args": { "External id": 24263,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11614 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046591.131, "dur": 0.063, "args": { "External id": 24264,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11615 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046591.462, "dur": 0.058, "args": { "External id": 24265,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11616 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046592.201, "dur": 0.070, "args": { "External id": 24266,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11617 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046592.535, "dur": 0.050, "args": { "External id": 24267,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11618 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046593.303, "dur": 0.064, "args": { "External id": 24268,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11619 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046593.627, "dur": 0.051, "args": { "External id": 24269,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11620 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046594.312, "dur": 0.060, "args": { "External id": 24270,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11621 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046594.636, "dur": 0.049, "args": { "External id": 24271,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11622 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046595.181, "dur": 0.062, "args": { "External id": 24272,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11623 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046595.506, "dur": 0.051, "args": { "External id": 24273,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11624 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046596.315, "dur": 0.072, "args": { "External id": 24274,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11625 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046596.645, "dur": 0.048, "args": { "External id": 24275,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11626 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046597.461, "dur": 0.070, "args": { "External id": 24276,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11627 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046597.789, "dur": 0.049, "args": { "External id": 24277,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11628 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046598.542, "dur": 0.069, "args": { "External id": 24278,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11629 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046598.896, "dur": 0.051, "args": { "External id": 24279,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11630 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046599.467, "dur": 0.062, "args": { "External id": 24280,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11631 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::result_type", "pid": 1336754, "tid": 1336754, "ts": 1295652046599.775, "dur": 0.063, "args": { "External id": 24281,"Record function id": 0, "Concrete Inputs": ["", "1"], "Input type": ["float", "Scalar"], "Input Strides": [[], []], "Input Dims": [[], []], "Ev Idx": 11632 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336754, "tid": 1336754, "ts": 1295652047226.430, "dur": 3688.643, "args": { "External id": 24282,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11633 } }, { "ph": "X", "cat": "cpu_op", "name": "aten::_fused_adamw_", "pid": 1336754, "tid": 1336754, "ts": 1295652050417.465, "dur": 334.291, "args": { "External id": 24283,"Record function id": 0, "Concrete Inputs": ["", "", "", "", "", "", "0.0001023488255872064", "0.90000000000000002", "0.94999999999999996", "0.10000000000000001", "1.0000000000000001e-15", "False", "False", "", ""], "Input type": ["TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "TensorList", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "Scalar", "", ""], "Input Strides": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Input Dims": [[], [], [], [], [], [], [], [], [], [], [], [], [], [], []], "Ev Idx": 11634 } }, { "name": "process_name", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 0, "args": { "name": "python3.12" } }, { "name": "process_labels", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 0, "args": { "labels": "CPU" } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 0, "args": { "sort_index": 1336754 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1381179, "args": { "name": "thread 1381179 (pt_autograd_1)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1381179, "args": { "sort_index": 1381179 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1381179, "args": { "name": "thread 1381179 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1381179, "args": { "sort_index": 1381179 } }, { "name": "thread_name", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1336754, "args": { "name": "thread 1336754 (python3.12)" } }, { "name": "thread_sort_index", "ph": "M", "ts": 1295649886385.744, "pid": 1336754, "tid": 1336754, "args": { "sort_index": 1336754 } }, { "ph": "X", "cat": "Trace", "ts": 1295649886320.355, "dur": 2166350.690, "pid": "Spans", "tid": "PyTorch Profiler", "name": "PyTorch Profiler (0)", "args": { "Op count": 0 } }, { "name": "process_sort_index", "ph": "M", "ts": 1295649886320.355, "pid": "Spans", "tid": 0, "args": { "sort_index": 536870912 } }, { "name": "Iteration Start: PyTorch Profiler", "ph": "i", "s": "g", "pid": "Traces", "tid": "Trace PyTorch Profiler", "ts": 1295649886320.355 }, { "name": "Record Window End", "ph": "i", "s": "g", "pid": "", "tid": "", "ts": 1295652113863.384 } ], "traceName": "exp/mtp.1B.batch16.seqlen4096.context4096.warmup2000.update1.steps200000.lr2e-4.cosine/profile_trace/iteration_1024/rank1_trace.json", "displayTimeUnit": "ms", "baseTimeNanoseconds": 1751410836000000000 }